[{"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6992544118075613, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2553436545324885, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5736784312644658, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32082132170397326, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678362620952877, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.548673470356335, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019531331018249, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.28937170305152166, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252600579691343, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35577487312218337, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12765262289443963, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15610490149220838, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.225416602635239, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10594827931433726, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11596071581769822, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43206339300361657, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10894503861644451, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33982763766501195, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091976063661931, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880119017464, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6740504768627621, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44360042146916023, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4054487294525705, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218814561798424, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791988702819, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.372048789736025, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16238001858314707, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6224593267459505, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.455198602595427, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27512972001934843, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13386749680024493, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22541660898795715, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21866937349786192, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09807932349409901, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310469534198, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4054487434852642, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2281565072316535, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12940273444571312, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213912595541, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1634454388820415, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7813306391428124, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6224593350562049, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4629586084572184, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358146325136, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.752012552983542, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817894151427127, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16885695829372618, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2043418956081162, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561503883318144, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046332133351, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2991051877878982, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2909808564430499, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17328821307031467, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1699562376001232, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.640635873888379, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2422056274024481, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27202457576854455, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23934933473999853, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610216512652, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804804428587, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3259495247616708, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5813031034340723, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5253688220239328, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907615386523304, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197656737504, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27512972430273225, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6039318341507177, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.457136734463325, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220179181076927, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758399546555, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5486734879208378, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4035668588194874, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.537041367280445, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39793840741375014, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282334010037718, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2538610132075555, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13386748806444687, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1175721364087374, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668456029664582, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748799661253, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41679664701436003, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4263216024700873, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2479874110774674, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688040433275, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.324235393987258, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14511536249093002, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3090237056468115, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24508500039634556, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941408940148454, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004405907782, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.359364143522451, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5292633824102009, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6113819788961519, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1871326907575644, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922078515093335, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.148047189442277, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6169358111074945, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.626124147600788, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035561945386, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.575588010214611, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3191213886592831, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6688802539469344, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18952109975253748, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370308069215356, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982165266521, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31742627665183676, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4436004252638914, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3311197152680188, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2814056014482214, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684798986682, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37570648921674055, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24220562664953846, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45326183670447096, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059959947609193, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36116472925061655, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6424324706233573, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7879311828316391, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6548947246424406, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34158249355714415, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063927869194, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7956581115540166, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6688802777014485, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.926303725681105, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431679919656046, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094749954778, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3998116499689646, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5774953726886497, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5640984868397287, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850296401716, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094665918788, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48438006816622586, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6039318396673501, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4130035721556582, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786212630781, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30735801097362137, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2798285085745122, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10594827812933776, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11124121911053185, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07531230745016003, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510838953433597, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33111973245835596, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.550607375006096, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2704802385919101, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132024036367792, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106118817524582, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15713685144328934, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3998116181256936, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17553806761694024, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17895589150333294, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304215511833374, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9278878041768076, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9706877689258586, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8824278666734734, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.893309398160891, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9726235116667801, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6095241433361156, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44167302504720585, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09467769891625381, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22953522162686607, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23792989811390206, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9678992931265199, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9539660991436806, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9348724528307923, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9536217940005829, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9658995740574124, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3208213017075409, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40356686874692504, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3415824877417378, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.41489882985370685, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692496735999, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33807712894388764, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4263216047156491, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.586996430654341, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21206879941858517, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4148988457337432, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7853085792989187, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4493926577516046, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5214711608104076, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486735015954086, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882834083315681, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37204880090188575, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2735743930061615, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.336331048818529, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2213507037668293, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544871378065656, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3073580129640087, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2735743807087145, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34687307631767866, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782350417018323, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573597342339993, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12852513472473706, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11757213290485234, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16776334860620973, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11676401150087559, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1347759160010157, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2173375014736449, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21601153721022864, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19930799145220035, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010666339556491, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.464901553318302, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35398630787473656, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3849121707451956, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4205995869129507, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615857140927, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45713671689209023, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43782348462155235, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4263215779499737, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31912137790569844, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2553436458796829, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28937170397758233, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.345105283543969, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18832398171658418, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.233706340004734, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13753247013886127, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11920292782789232, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2674081611767586, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4186969160334731, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2120688067457063, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761279375542, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061446268793, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27357438225647795, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7122321916182545, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.390475853879848, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2974699633070511, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25091278358650015, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08945460155536017, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07477004805257767, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09138210432147892, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10158944877786497, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.04401865099580226, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3174262766928121, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37754065911236845, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10818895089096088, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771398368994, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31069438610581773, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4148988388529616, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44552954716109244, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4378234850296388, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984285999636, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45326184487225374, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36477757386749193, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6959583152434817, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3720487997344155, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101676299872635, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435095857098, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19314738479094656, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28457600579481096, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4225046152535055, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806417457924977, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052790535727, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3090237108663427, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4397473319358389, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29746994383934583, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13477591962079905, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936686481292, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5660185299823667, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.46879062882588113, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6315942916907376, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658975693362617, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213036596708, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31236999889897754, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25386101850938064, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2309197567042978, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1451153493004376, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344543376284404, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7577943699511699, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6242935189057595, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49609384738480317, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105599843749, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916091639458, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6261241724172651, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23934933521717153, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.734119522791158, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794003929862628, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531248140124, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7185944001483457, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29421496743245856, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27669052196294064, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073334137076154, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39981165773664556, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29098086296045444, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4397473319358389, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15817435602592225, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937170355439856, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118841110785, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29746994869430343, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24653333295335694, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19806416934893145, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641279074841, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048021239178766, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5448013977404046, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4571367381143821, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23370634337041893, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306417752204536, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468793730908, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8104789018063401, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22815650567260992, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5563995695728947, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519861754630014, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15921740798046877, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18126321186162403, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4474602987222152, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1688569504331793, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3208213168262635, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845760000670998, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11676401228583147, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20055768437750257, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2509127954763484, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27357439847874, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061663932048, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9314625052898561, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9553191259868381, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8749346211261854, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9299510395888873, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765192980891, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3886180327288401, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7931059346845307, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3830641958269361, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982229738228, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365529539044, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.523420329357827, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2295352044152671, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6020615815952373, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864516490386727, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936412614537444, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33982761764821384, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3040416885632722, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22270014268838545, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632608230155, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936490859791, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5563995786075341, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6876299929316867, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5888891360700633, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708840916013, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891324751485, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22815650688495262, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2309197515911806, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2583259733191504, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405545745538918, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798745411790643, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5621765046333077, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6976089172758676, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4397473367845295, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632159282573123, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42059959559648713, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4263215793121128, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3345894224537619, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6992544252062154, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2523840421799757, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477758881026373, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27202456521250257, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5214711434020868, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.556399578268508, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24364242041592427, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633152700839, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35577488294285253, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3123700158944418, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.339827629947221, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37754067034719857, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1655931140565549, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7772998532441808, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6388352931812913, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6654105593738672, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746359478407, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646989494664, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.759225402405664, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5525397156337913, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38861801678158925, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575934468681, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704648013109145, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18242553179054546, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3575675221814992, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4225046259917193, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38861800314245126, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477755885489876, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.245085005723811, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47073659992695654, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22135069616290615, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508501102576213, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364246266177833, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.172171851398928, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48242913774333046, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910886314008, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776334230123388, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310523861124, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.840782591771595, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6876299908632001, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7676898571522903, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891227619164, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681583179306, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.414898844510928, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.46295861537795024, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25832599998495726, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262428801041, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735095252133, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41679666332021814, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7759445349206161, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18126320138087668, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180217814444, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218813631674324, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33458944070029073, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3886180168560796, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3684057170685793, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984210055294, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40168780556549266, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4726834733839977, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6636689434929363, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4610167790618647, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013907334891, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013656114215, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18594721518896695, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18832398007814105, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2227001503324516, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09203285965707173, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16667540244614007, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5467381566442258, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.422504633871819, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39420094225055685, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1710611818522735, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300358568905904, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6531269649958623, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7217432140430042, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49609384429268255, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544874732720315, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49414089727634675, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6057990571362892, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36116471440876835, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2861692667035502, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791905955703, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817893432553763, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5058591224461868, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38491213625848075, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181322237144655, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804395031269, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3433417409184125, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22678363083786357, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5019530970563195, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.267408162353203, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017825837246, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26284185026978873, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30735802338293994, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15713686380657457, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002881688790903, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808583014386, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.292595296700592, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16238002562887718, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4130035863849479, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166107931724, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23934933972634173, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29421497690145576, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15610490071732763, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14414884539454734, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16344543526350205, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1225232146556056, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5602526212262848, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6825737379086128, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.44360042963571705, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269869214627, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315514795322, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5097643933079552, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8697145750897747, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40544871520719106, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541659906234915, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624778361047, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3451052915325813, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11279539769186574, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2509127902008258, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121746189579, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34510528591550504, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1883239877576101, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.413003581189364, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3775406646657143, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921739624462478, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678363484488437, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11047115577356614, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6001883318394067, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18476751161751342, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.132066152572146, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678361961439664, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2720245745655851, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7634837747704745, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42250463146325856, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118756663706, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814056158713792, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24364245369514737, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13939637485626838, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3849121447691143, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2146914141249663, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15507846618688845, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6513548610751255, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5563995911736753, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4687906261731622, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238678347011, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737307944076, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34687308205171086, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5774953745490513, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3629691902293054, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1302854298173227, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41489885075375643, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14223189358484564, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4824291168051054, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5544704576248184, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2735744071801074, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47657963644459345, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.715423993457367, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6370308167919835, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5583269729411181, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430453900788, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046732219925, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15507846590251784, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1460872527250678, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18242553114533336, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601153085267855, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17895590084389743, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8998277809229044, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7786492994057453, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7154240019735613, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740150835927, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281448085139, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5331543939735314, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7325918428485353, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.48438007046088816, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434963550013, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118792907186, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.209469675968787, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4378234941640703, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3923368135192046, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011657936094, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206338232877634, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35756753396658864, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49804687353780797, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3208213163119655, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669052697838514, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23792990076018744, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40922079750434415, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7577943632400393, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16132024412266627, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233684186336526, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381368586466, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29746996216956717, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5409238670469646, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5736784162345514, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18476751523444684, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3998116612562381, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16451645849655913, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3849121663553559, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3557748701792057, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106117823059713, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591058924792, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8322366545038334, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7969253766631744, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4130035826039543, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030884255221, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241749119239, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11757213888731359, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31069438811738825, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07640767975755956, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25386101199927086, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26894143566552414, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3259495402893156, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5851011546546038, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42823339234939867, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136858014875, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737319781341, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19806416704384613, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11757213288760195, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25832598179444155, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2479874408953845, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946969906107338, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36840572132765725, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39606816997660405, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26133092132846736, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181321997333543, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939262106624983, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.383064156079556, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6477982245785191, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3123700176517715, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24364241512425014, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42632160206341363, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5136684540770592, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3942009459151213, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6531269134162683, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798742119831008, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324934315405, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16559311084518, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5506073663352307, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30902370557208547, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667539606208231, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2267836313021726, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5234203501805337, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5078118670497619, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6352224239082535, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047868240364977, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641946782162, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23934933480030293, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4416729882109183, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3040416864848522, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39420094158717267, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3208213287991848, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31573597853540347, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2735743930061615, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12421300289685185, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2213507037668293, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2704802343192195, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44552954234406694, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6808786262125001, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.48242912880836286, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573599531271945, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982762689106855, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6424324826697346, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4320633968879742, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39606817448150905, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798744260347477, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616926008912486, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2365162336229364, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1216857448411662, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19806417154171807, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25832598507009535, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477754314235233, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.0881900465109827, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3398276321406256, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18359362707552077, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14903529200077104, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582571107383, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3720487939268357, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3363310546320584, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27825679257404584, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34158249425394877, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643893179377, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27357439442331277, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27512973050253586, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1623800292336212, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.201813213396038, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1847675059038275, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24798743910000431, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6495786154883917, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7905303060944727, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.48438008617416306, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41111086246507594, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6584175018299032, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.34158249108181504, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4186969125810912, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093652327127, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720487963146677, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7662936525787755, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8354835358009507, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7931059353471495, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358738163835, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767856677379, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4474603097701912, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4320634070285256, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2814055924459507, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42250463247472925, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866937434653175, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6095241655741632, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6442251124628035, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30404167614288924, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776334533896078, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23934934243191314, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7732163781281068, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7563575515178041, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5602526654153688, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799929028284227, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281454496039, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9073122205812656, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9518632276364819, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.816406369411459, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9273632924140559, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545664046294, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6654105664158239, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26894144099398354, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5813030882623911, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3311197373624492, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269148794097, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2583259751377769, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17667159827689083, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26894144502352646, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776333864303844, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31237001058988667, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3923368374117139, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1801066670711757, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31573597733587616, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262862145586, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.198064174830384, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2861692646523755, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47073659992695654, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3629691933509101, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508501102576213, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364246266177833, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5175708973077732, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019530959427735, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43206337286116314, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937835525724495, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9429286031267844, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9420819149365496, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6150878573763369, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551986272894675, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789081531948, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2658804803978354, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6460136996875507, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43206338346161194, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2479874388153995, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631850660232, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4551986001844127, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5078118655030328, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07640768162137923, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238002463145396, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16885696485290894, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25386101145783313, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5331543978402287, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8661325175553461, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263215594382755, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239107150788447, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3276682983786216, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2974699548720334, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09670578621032205, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838510116130904, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42441202039316395, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22678363848747243, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22135069203357396, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09947021182207574, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13386748521008984, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064738427785, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3106943983578206, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19436781193785094, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22953521872882318, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18242553450067617, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3629691856508831, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11047114431993706, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2613309238398994, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2583259754108441, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.33111974368950886, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344543489300126, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4493926293737664, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4980469066039486, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32766829214969223, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.405448736803984, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.503906179959704, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19559407716861757, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3557748776246588, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24653333811088032, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667160253523403, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641772400293, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9202179905336219, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9637799406186451, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9559813486047343, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.874077234354135, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9268352775175231, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5312093700355683, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5234203153649069, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25238407203171903, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.139396389152895, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32082130192556413, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4610167747363897, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5813030901250207, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40922080256256194, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3398276235417699, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643826268022, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5717666136595582, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23934933521717153, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8031737896039579, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794003929862628, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004342081981, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4765796403914896, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3611647258088386, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4941409027471309, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199169589814, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477756900505387, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11201595142735828, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5869964334434938, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6370308136793356, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193279566116975, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.292595326906889, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4726834614728234, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4668456259884597, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27825677793890435, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2643583379637875, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.386763451607206, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4359015256454367, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3629691868352026, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5544704729316466, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180205577896, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894423524438, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.38491216837042835, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6424324890438122, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.44360044482239813, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995623718875508, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720487872642508, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5869964267470369, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4863315283805316, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5214711681457257, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771315470604, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117165951301006, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5945512600760455, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7690802483077609, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7090191384020422, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321934654725, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.830043754221743, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.637030804672211, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22815650567260992, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.28776781497627246, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46684561988321377, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2295351979691739, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2658804760615829, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1441488491792712, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25534363637242036, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910911864995, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561505902828991, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5175708731809209, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1294027289973123, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.544801378644533, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.531209370060674, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754263227571, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4726834832544022, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28776781311274224, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5214711552956582, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864513729927854, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321752586529, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12336561340147055, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2643583563424618, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07316471739934115, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337716848852836, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1688569516685426, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09534946306351058, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14804718394980498, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20055768462874848, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22135068673491237, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364245632757195, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23792989224464034, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24364245733811304, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43206339165938246, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076628258259256, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2323101642647665, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2735744012116028, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2925953123632868, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2107662957853721, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204879414701664, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19436782382837423, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30404167478807503, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48828338851955744, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40356683959895157, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193278559229335, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.312370003213795, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4397473197899619, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.496093828698951, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29746995527288356, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2120688045620478, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174937436886, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.531209388513505, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5467381475970939, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.74017436649834, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647839731004, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880115888956, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43974733655232623, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5964331342401297, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5907791966549231, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203561920242, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802681759102, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23510837811578567, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16132023296580938, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10087861360825674, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1666753983239126, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132650627556964, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11516223279785372, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3504213765729344, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49414088948008067, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740816054094535, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245459750867, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.689305600960456, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5563995814499235, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.718594384732631, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.381219582717062, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42823336960049135, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2379298900791561, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3433417356473869, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08819004686527646, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.480478667857783, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3684056995776313, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18242553164490355, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22953520926045584, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21733752063719372, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1721718533540111, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1666754005009344, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46684560126229335, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6442251125784202, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5563995767214931, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676344963578535, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756751879667487, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26588047639361945, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5039061396197263, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25091278383559956, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.651354854651988, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32082131153143006, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8300437632857517, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6943026716022057, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8679338415762418, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4111108681415613, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317075117429, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.476579654131163, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16451645625583622, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19682620357806702, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1613202400570085, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29746995981059027, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34334174230965825, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19930801159369851, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3468730806731496, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092207845587112, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121956962963216, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32766829443384077, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17553807010457817, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.28616925692832457, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553806498877933, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1510278125640225, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.38491212370400446, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3593641537554022, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35936413754272073, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2974699364572055, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293917057449528, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35756751951028287, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44746029151248307, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45713673585808895, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204879955914877, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2295352050613976, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7217431910909408, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7008947904551429, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3942009691490709, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132649183380075, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356687092663207, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6584174915827943, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48047868532888566, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6791786907334761, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.550607365512934, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269233061539, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33807713612957674, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3867634278195732, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2845760173756126, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245647647321, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315436802899, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16132024111244694, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14706453703251363, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22135069051499154, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771356455208, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733752357689287, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8519528134054968, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8697145772325839, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38491215696819026, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.727975446605953, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195286411633, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6315943001199623, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41679666718069097, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33285233278822013, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023560311087855, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.83440688163452, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8116760181012508, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25683200273056817, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.540923857863525, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3647775612322253, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.414898838416591, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5926665990117345, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.709019118717151, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7676898708052311, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552949510073037, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998597033758, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4726834817914972, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5214711642379711, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5679366070981486, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34334173600046924, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843800917598233, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4824291102228425, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23510839118472152, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43398146595629, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242353976550193, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37570649235635256, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6132365741952011, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12252320838052283, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19314737371017146, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18476750991282356, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015302103748, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4397473491852836, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.571766571893089, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5583269997044469, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195356783254, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504554417008, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23091975262498016, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.34687307398283246, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3451052826573405, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47657964093477334, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307463291525765, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1480471906318356, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22953520945148922, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1859472058625856, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252600035193457, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048022509456665, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21866938149836346, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44552955166961283, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2351083895236306, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646098740883, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4474603113124749, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2798285002974071, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11596071519287068, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22270014588922016, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09602549068215237, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09073548773133214, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7704647674165389, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5755880037031302, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5058590667470031, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331717655055, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791988998725, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5428632651750507, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5544704745438921, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39606814352408015, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689779245288, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633735608545, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6424324873062746, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25832597045788397, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43206341241350427, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092207958052413, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035715299044, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2133771716744416, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47657963937432923, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.46295862528570614, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476828740431, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.571766589235005, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3886180338398072, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13660840415452982, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19193280710529614, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.40733340488463904, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1540575603769379, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2583259679072588, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5506073674761045, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3242353937795184, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419973034528, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.439747347277977, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6943026456000906, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5097644108194588, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33111974235988095, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413848756067, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756753739558955, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9235923215570293, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.837619968440442, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.916708075109772, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9515040013728476, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110481244594, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37754067607443914, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6992544104636426, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18952108205660595, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1919328034351097, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569731731331695, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12765261759883084, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13660839437621508, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09467770531087462, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1001722277994007, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16026604236316025, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25534363944547134, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3486451347614203, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2107662939925511, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667160011094876, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19930800659065714, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6279512247471669, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5097643659189539, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3923368130238988, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643508175582, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283008477161, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5583269746673464, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7759445373944267, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6477982257773801, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926488321523, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740193732569, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40733341827032105, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47268345844724197, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4205996124309982, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4785288415094204, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881146711334, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18010666851767132, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15102780399644278, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4148988229272, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689406336623523, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3191213793241882, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7057850301379144, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.462958596180668, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5234203614529259, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022537209321293, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206339337608596, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2991051782896685, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24508498765468947, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3830641581794738, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3684057094120655, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43782349697344214, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20689405031265057, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6774740016878013, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5717666009351206, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220179046044087, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.486331530884902, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5195213192724296, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.808067193184766, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5832033505794868, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937839028854514, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218812503108944, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23231014473256004, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2643583698478674, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39606817139239214, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24944724468478127, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42441199340854396, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08093671473737236, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18713268717955395, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.264358358079619, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13568954621477208, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10230469918612381, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5736783995869762, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5156199204031046, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6352224348709136, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676342816330017, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702753685676, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44167303262735885, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44167301050424645, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16026602943194915, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2422056364489965, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121392139684, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.707404696350107, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.08694165663047392, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25832598076949626, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964216619559, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213489769842, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2658804717561354, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11596071971147512, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3293917142594939, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15817435290323112, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1778108639114937, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20307463045696358, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48242911715393993, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2766905351386333, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058590891372564, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881300393677, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817893328798054, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39981165093213833, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09670579021042691, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510837604053844, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38306418190564695, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7592253967315448, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3593641429886007, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3259495303381333, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585533646881, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321845694204, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.509764371184465, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3504213812215476, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5350984298320915, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35936413619927426, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.523420352887759, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3486451435438523, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2689414381827389, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3575675166541288, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930799993384582, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035776725065, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.42441200061199225, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4073334133039597, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5253688155191649, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13206615708326816, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982761455242316, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.550607355224469, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.546738149821806, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6859494572685683, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.569852642642338, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519863784204434, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18476750870976671, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2782567937277557, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12168575114852487, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07864238118139981, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541661141523203, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46879062486316525, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35936414843172665, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6688802702344817, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713673373580216, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526762024039, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5794004093009444, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5370413783304239, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5774953641764444, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791954484518, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517122236245, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2068940562891748, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27202457576854455, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3757064887235832, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12168575956173347, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32252598641472313, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35398630529679215, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7549149861916727, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2798285087045655, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531277701956, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358518278391, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24653334744772815, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4111108566795109, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14128142204196856, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46490156628351037, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575268270006, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.42632160569757793, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6825737292109227, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8140527965322127, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159553864324, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737930298257, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3468730714060245, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3140505465841737, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31237000438587775, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051969158455, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944723428343415, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5602526654423949, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7090191305882263, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41111085539572256, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22953520800861935, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36116472270500255, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45326188005228046, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2295352044152671, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49218813185651533, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168780168522167, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3702254053130012, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.963779943558065, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5039061820145609, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7634837748026013, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240893940203, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833971305497, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22405545271634153, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3793783901447507, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37022539234179885, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199064655081, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052731117962, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5448013767661474, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33807712549324614, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.44552954824478175, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4571367175211986, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34334174057019895, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6039318235737012, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9268352799449839, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9585377251348606, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358198636884, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204149374975, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23370635025761788, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3225259841554025, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2523840373165519, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784184491898, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381539842662, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2942149639361399, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17895589052754549, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3960681898962022, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522017703569389, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939264062323514, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22953520878647327, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23231015531829446, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3702253826155735, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676346637892983, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541660391279772, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4016877825730596, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3242353833876359, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20561504802955025, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3575675357725526, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204879688287606, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43206340540920146, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2958398688411802, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2005576708253492, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748730087751, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11279540089363199, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5563995857334302, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.649578628846341, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.729519791954444, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804786783326561, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269713949917, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18594719308459642, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32252598840312796, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25982564855144424, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24220562860076517, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064895029688, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1766716111647136, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17106119198212444, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2173375194024273, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16885695455461774, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10743747211029568, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2829881215987203, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20181322195378432, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24653334750539904, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035823713417, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365730192911, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15713685881131467, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2107662882159102, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2798285113531909, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28776780211106306, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1812632136262485, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1980641779859026, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2877678079968429, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2295352134859368, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116471691771046, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000710818460378, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30074558012407077, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14511535393582747, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29259530881749146, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687308127979116, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3311197464797725, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2766905167892458, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6352224323008758, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5794004099199703, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4244120056334327, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18126321244863172, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07696083646685149, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13477591794686825, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1602660293398053, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18832397308376655, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127890946563, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37022538261999616, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6442251124628035, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27202457056388146, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14318769951445137, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30735802615888014, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.426321595273529, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6076631879334959, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1732882050401825, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4397473399234929, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.529263386160256, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11047114161986013, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15610489474988568, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2735744066089061, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13028542787383046, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10447731908837123, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2814056042198774, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4707366211463772, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25832597523268297, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476598494321, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730853566624, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5156199027690518, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.880797077851088, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7248702781847568, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026725495495, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.967899292097777, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2974699127449292, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2379298890083919, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3328523294806514, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926212358885, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3311197596102492, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2798285023281498, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4186969380601334, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4339814694523356, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213355828936, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982265368426, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36296919272986206, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5660185289508406, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4378235000614425, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2568320082862002, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2120688008409678, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14318771590438265, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45326184606572384, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2186693721995297, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2281564905389815, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469141623232, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15203224566185455, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15002881870878407, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2351083949109391, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20055767314876757, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11279540848953554, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14608725005053566, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.0869416613545807, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16885695775124346, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.052618955321141664, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1812632134932177, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.38491216102480036, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15405757120664887, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3174262838719212, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42441201008885315, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4902356136194329, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32252598931329723, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22678362788085388, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11920292436861876, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.065127549264925, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167855616611, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5945512840692098, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8386797645850044, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.890294225586906, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640199546353, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056141547599, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15203225134366516, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5253688112247387, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3056973089471198, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.414898836658645, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421301718049756, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2942149757193756, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.781330620052409, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22953520601748587, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4111108483607757, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017834706626, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5983121863326871, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6460137058991373, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30074557409720615, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204878589774565, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416225072375, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40356686822023236, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3867634596814215, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3293917307420923, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035751791134, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18126321318050195, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24653333904200203, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6334102687386748, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2735744011044044, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473555111698, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2186693715863465, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8311430475020851, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7138307408154558, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4921881410622181, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624879072507, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283081421286, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19559407215989355, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2213506921629591, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1710611916969613, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561504468721603, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.222700146713138, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8791467715596681, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8962513720753895, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.773216363825452, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897310045477, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797609878731, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2479874422131136, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22405546490535694, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5888891290385203, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679665718159187, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073538254935, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11047114961987693, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22953521561225707, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14706453395161753, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18359363598512082, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0826973408898599, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1634454334764007, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23651623488577503, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10894503434643134, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2422056394741054, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20817892293866783, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4148988432247715, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5273165352274454, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2351083979856972, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4186968858350026, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358411147057, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5136684578882784, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32082132282389314, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4843800684739344, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585964122867, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25534364209281807, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30569732266799987, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4436004258388358, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6548947244411638, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632157788175223, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707366042325591, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4111108714227617, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1847675109352608, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2553436394524567, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633105449495554, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561502916590169, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22405543746609835, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18713268049946283, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5679366018810731, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2689414341733182, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953520466553687, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29259531958268703, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36840570855215626, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.279828495039008, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495202142295, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953848020059, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39606817248475146, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5774953629459367, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.322525991228854, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2751297251196772, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3738758285931713, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4416730301406445, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.640635850287161, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.633410240081728, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.218669364059869, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526535410904, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6495786252702074, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.771843507348681, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7534666523391415, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585634183634, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884661177087, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.692641988088018, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6057990533467799, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5058590964516957, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974732828573054, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38676345188025996, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.044680871543168285, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16344543296895386, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19930800497358456, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689406734468163, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15002882393131672, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5813030767299516, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2798284984794639, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47073661383794363, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413858017624, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331270030817, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4687906185105039, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10669060231981878, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3380771441194113, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.129402726416557, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.319121399720354, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2465333335029648, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5156198899594688, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26740815909462634, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487479912077, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.217337517327297, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15304215517480657, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5832033628778015, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4707366099191989, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702254125938411, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013827267226, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19559407315572505, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8031737924416665, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34864514740881614, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665916475746, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204137071365, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.05500528280555663, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.061875985247991164, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08819004303148212, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594721017921745, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0348808877033676, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18713268445714815, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6688802611881778, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13753246891745727, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.165593118672212, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1375324638094354, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5156199341873903, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4707366187799748, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5640984733162974, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947194005483, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191391804391, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15002882078126137, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12678516663863398, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10158945591133095, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937170260846423, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2568319820994169, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14903530014698887, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21076628653609278, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08632347321296491, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1789559022294069, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052948190438, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31237000838460866, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2974699391046106, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13939638750772593, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123700063032548, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4016878018407121, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40168780007669985, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4436004351409209, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.133867490456706, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26435835902642124, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244119695239259, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5039061582284403, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2689414407948177, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.525368799801086, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982212128902, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631745610517, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5621765019309325, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5292633812973778, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6001883320823777, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641379609829, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953770374704, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2861692687301155, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3998116668811273, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34510527881801834, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31237000238713203, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20055768823260658, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30735801348443753, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8365545597136823, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8233283850277562, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506703260056, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199244451984, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4339814673214609, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3942009682415432, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8068526110758202, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926542370169, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4960938418997997, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9738443810351605, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9832145095853719, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9763105299503452, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.953966098566249, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9766692325306977, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1540575679026528, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4016878105779873, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16885694677153978, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12506538034927892, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370634138141705, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817893347397678, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8848377637929298, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18242552494738346, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27512972777747263, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16776335064772852, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5486734716192314, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13568954535776537, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4726834758284174, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37754068257786694, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2628418457698227, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6334102647931212, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5794004103487231, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5736784104315372, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165140199669, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3812195839439607, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2422056410496606, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30569732081352546, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14414884941102182, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2068940559084605, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34510527657229434, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4186969438761217, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5448013888938236, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5234203471569381, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381356903485, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2798285119232134, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12940272527348587, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8848377637929298, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5525397311125197, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27202455087771427, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015261264225, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6150878458309599, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7356416490127133, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5331544123586601, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740269678833, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228840682881, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6584174972362482, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7090191305882263, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5019531297508972, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3208213206441932, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213444058217, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18594720755538496, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43206337810941275, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2479874472198041, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18476751594941948, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946969714669528, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5312093733647877, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3023910920067157, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.764891622278641, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4225046141099885, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026825963001, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4397473262309957, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27357437990860145, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.372048792531296, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567837863265, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17781087344714597, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4301473603904506, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5409238489463043, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5039061689997438, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256450796653, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594952755448314, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29910519435295563, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24798743811783305, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3738758030806011, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436782389326474, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310413420101, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9575961714666321, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8587185850234942, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7918210749181028, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256550253523, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148289116234, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27669052504078334, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8152324886972124, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6584175048563884, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3208213154844665, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137014075518, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15817435904571983, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5156199096558641, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13206614757256624, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44360041187846166, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14706453740711847, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4320634072586992, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24653334411016298, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6671476596084039, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237094098166, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16995623751549851, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48828339726397213, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5078118739026221, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4205995863876775, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583987969909753, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108608802456, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5273165311934886, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5945512717772071, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42823338063140615, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015598520261, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206215905718625, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39233682024533795, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40168780617544414, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5195213274981874, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47073659580097793, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358077206842, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3486451479294595, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4148988249398182, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36296919605255307, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653335933084042, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11838509326734956, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36477756933747124, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3311197270984259, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2613309155625505, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270014927855852, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436510018326, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11124122065764211, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07864237831477465, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12940272780120438, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.33458944132248164, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798742585690384, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13939638518507078, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20181322853396075, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.05261895375333757, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.044018650990661864, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07159119843101475, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4092208136753518, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14223189360329494, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08329192208560586, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09138210811602746, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632815665773, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4186969245039606, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7154239966590581, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6909762902017746, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.724870270766598, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063707442446, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.756357543284072, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8116760090739178, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.786622827940583, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105527783145, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388185123915, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6774739970489901, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6791786780508916, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.607663165242944, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321776276395, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583271695431, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8386797539702164, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6370307959704534, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3775406645707746, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366012306569, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222962822208, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3208213071360947, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37022539409423005, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09602549520929318, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881372727131, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26588046649400526, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3629691869687776, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3720487796603925, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4130036076549532, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3040416885074869, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293917367075652, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3886180059210395, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5525397156337913, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6039318093153502, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474602956516714, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548848351299, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12336562290602548, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32939171195483385, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3486451512786185, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223188997480787, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508501245951422, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5774953861476557, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48633155634097963, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49804688083913073, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117165930624097, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668456054506545, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3904758164482386, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6723317139634439, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7634837626112527, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46490156170815683, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754232159013, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7592254005370084, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.390475825934884, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4590761304279187, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584174987989178, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45907613209733095, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3775406607694571, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5486734816587001, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35936412820028296, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651622997408625, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19806417174108867, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3923368398492983, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32252598840312796, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13206615696406218, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009462864339, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310482678596, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5660185576471808, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31573597799855335, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508501386556533, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.312370001531812, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24798742478523775, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3468730961124588, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39420094270300016, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263216112329591, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641305958013, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5292634170106251, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5409238886963335, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31573598145333803, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118971875095, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872210441429, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18594720549170898, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41679665818687667, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.44552953728116046, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.237929906311002, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174875587393, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8783142412365956, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8688267747798282, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5774953612061654, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036142117814, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9124361602877931, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16238002080857825, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2538610196730345, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3665897225356787, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508501987220305, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982763509616576, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2538610174342187, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.294214967242765, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2094696915748892, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941408762560607, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2766905325782049, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36840570214723595, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1441488607886167, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910791906174, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.282988114203487, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748834519229, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36840570617470814, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44167301489952976, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33633104878389297, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073580288151308, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658972581589855, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28776782033870574, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3242353859198676, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3738758210624393, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180266603686, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121627921727, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25683200125944994, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18952109454443936, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22815650281098057, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4186969228124463, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1835936381624488, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3960681889105649, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4416730106804716, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.44552954684609697, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17441027576494045, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883391918619, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24220563823472666, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3174262733672123, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11596072439803926, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416730195268171, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451435162539, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09534945584776883, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.08882028633055276, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1520322405441107, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213141029677, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12940274145833722, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6424324752393273, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.581303086124738, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8128673115185644, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324758866796, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366060235583, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6424324629365759, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07640768340391405, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6242935147426334, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.801935820921814, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167303321382345, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4035668552259941, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6150878417839669, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6808786285423439, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102652524578, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.60018836309622, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4804786520419252, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6774740128373753, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.674050474532556, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748791007306, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891374960714, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17667161471121112, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2200071010817029, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1412814261581035, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553806435834146, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14128141931758925, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22541661210461772, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6076631600791106, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4843800871915289, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324845303506, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845759935261111, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6150878420645933, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5755879930269365, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8848377758623667, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631628330348, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.724870288709659, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5506073709968817, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4359015204376885, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43206339742724414, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634431835503, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2942149800367148, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7772998466175653, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6001883753960611, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6654105427308176, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802496934905, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.694302669904653, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14511536188455026, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39793841687407155, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20689405203431163, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106117949797076, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41111087878242075, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3242354075377331, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3106943938879979, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27825679183265295, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2043419020397734, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1789559037488245, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16776334518563796, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21076628755984503, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18713267274088344, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298812477394586, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641390274569, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2436424499650312, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.191932790011911, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16559312113321867, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203636602772, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1721718480920616, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1294027329358645, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35577486509314477, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5964331145317929, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306418652890495, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.350421379496527, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4765796543032551, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37754066861847774, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.496093829476218, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299883620528, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398147914040575, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5563996190234702, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39606818218140377, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4282333915080726, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953488727901, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633860242638, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.47073660136402257, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6001883514461815, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2942149690297385, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573598248417223, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544873734914705, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26284185870648924, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7138307374081003, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.28457601315530295, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12421301220553423, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051859942721, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16995623256723996, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6113819729870563, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4921881363902065, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118598491593, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318332659527, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5486734888639734, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3380771404687235, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4824291117895509, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668456113999239, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758393634448, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16344543768416683, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25982564501714284, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5409238589795717, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245661355002, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307462650639402, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3259495165103468, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42823340251795794, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1422318903954767, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2133771630202821, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389831923820996, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7386690779522531, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6370308129488982, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.564098462860828, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203636049429, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512062013675, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9900635818998155, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9763105287267171, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9600626830840251, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9887554395033802, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9804313244140906, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17441028047116547, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5058591224461868, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.484380091098144, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.151027807189531, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.649578625333863, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39606815337705314, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45907612705467904, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13753246985310538, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2814055934594158, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073579916064975, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6206215903004467, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17553807428148313, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3830641943057277, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023562572388535, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835442647477, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.361164715288079, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18242552414712698, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27825678373613427, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676341376993034, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1677633408784279, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3208213179383114, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5039061573797484, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37937840208735446, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.699254418331517, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40168779912302965, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24364245245017235, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4416730100970697, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2643583585371611, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743563151006, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33807712560673886, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3468730838118645, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24653334026698268, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733751768821982, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23792989679420082, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14223188600713144, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28457602453417774, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32082129892208255, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06560483576447203, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.392336824705863, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11516222736762236, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11279539770618398, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12252321056655639, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14903530705401064, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135070751005428, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5774953806081401, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5832033475250094, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4186969124354306, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784017960139, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43590151472874183, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2782568138411715, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16132023216856398, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5117166107761598, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31069439347908046, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2393493443168762, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44167299510221847, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4378234895966587, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35936415907789526, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008947960999306, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026842828834, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9111797096289218, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.910545397915399, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8807970869454261, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723728150964, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425345499533, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29746994650515984, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49804688892158056, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4092208019645508, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213986395482, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641896718224, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6859494546115931, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.626124184338739, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5428632599350297, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791944045987, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2643583605317073, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4668455956906552, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30404168095855094, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758009841019, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3106944074512399, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6688802752784718, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42441200671525425, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6132365520335787, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239795695578, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792148079057, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25832597571554033, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5774953688795265, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910970266363, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253622040553, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28776781325772494, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37937838524149853, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14318770224633226, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20689406119212492, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10743747481391029, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18952110596519417, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6671476721953314, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8670357579006003, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8354835490554294, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601294907855, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9661559666211784, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8969755724543197, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2958398686534379, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4785288348015135, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581000757994, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256484799529, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31912138858311245, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36477755347720403, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3611647189700218, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792989987744265, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4960938248030624, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5544704491286618, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3942009404620647, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7813305944514861, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102662547086, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755879997435679, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2295351986643008, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3311197270984259, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4320633885361239, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404168240644414, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364244623219333, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23934934065873975, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23651623780915906, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2598256278520609, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415824802208404, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786653456219, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30404167046366487, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45132652909380944, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4378235112253904, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.602061591080151, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033667962608, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.38491215395950634, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45713671144590295, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2893716909604313, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808471690938, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2751297341871375, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.310694392964036, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28776781835742954, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17553806625648527, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1412814169364669, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689406217049255, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5679365984262279, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6842640384006929, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6909762975607736, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251142255433, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42059961801320506, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48633154464348627, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7090191333871176, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8705972662164336, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802638596704, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321949211816, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5039061867276757, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6926419794335664, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5983122014834584, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37754067593739393, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203685100768, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8175744743403498, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11357959089017032, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7074047054758085, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4882833726272026, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.861538202718159, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3793783570758594, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26588047972471923, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3056973525471216, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165294056164, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11516223113239633, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.405448731052051, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6406358726345899, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31405055133600285, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.677474010797768, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213316875579, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2861692161733224, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5583269897426996, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42823339951287276, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074556387161283, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754068794024154, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36658974255307913, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40544871299449176, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6370308018073024, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2845759983359203, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733340970209664, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5583269770521321, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6113819762535214, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.470736623437095, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582474103583, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702740080056, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2538610089652811, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3923368252730919, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4474602992285772, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14414884977364217, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378235123903123, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3665897485556172, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6723316983163712, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18126320771518065, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263216096788664, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293917329468351, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07864238037930409, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17441027213341204, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.06608537370050854, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07423137004688256, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1602660320422896, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2081789341785965, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20307462755465283, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10970577029055198, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2751297260891135, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2583259831749198, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7356416230208417, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8300437663836754, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9566341998183092, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059403954845, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677567327341, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3433417188303109, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7520125579212497, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5698526572115665, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.651354872093867, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256261265037, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8479677581452189, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.808067205283763, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7310585533454672, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149059297573, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239842432742, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16344543409494872, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17217185696612827, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17217184549026185, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1859471984859567, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15817435388900172, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2958398676060045, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44167301136106807, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26588047563986544, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12252321407534236, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36296918862228983, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5117165859697274, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4765796581417898, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3090237044321397, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094638878266, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165186031075, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.312370014392503, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4513265352136198, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14318769986331145, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052992060597, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35042137205037105, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.0994702110836636, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1919327934243554, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14318771711474687, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0660853738375973, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610490471446323, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.567936585229975, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4225046517012162, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5409238470975937, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306418526887176, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.656658247089707, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37204877403609543, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8300437663836754, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4513265052456508, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786967206147, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.794384948372473, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20181322195378432, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3960681670850274, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1393963841510383, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19314737506349552, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7106283020515941, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8984105447461438, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8397339688154783, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891242613815, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389929128941, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4551986047691624, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5467381382546018, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.299105182273212, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4282334027536052, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4746311904070297, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17781087017225328, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28776782404161433, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2479874350672516, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3208213050184915, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398629218651295, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18952110276773165, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35756752367199285, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2146914110660816, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669052676547334, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132650202854563, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4980468811764955, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5755880409559051, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5640984922288195, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004030892803, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014735240906954, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5506073498766239, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3451052903021871, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2407745882837708, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2494472278379483, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5331543977139961, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7577943747075756, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3812195672061173, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101679566829185, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802690224142, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5506073639791214, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42632159016007604, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27202456635461314, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415824937991159, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42632160131290486, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09138210514545635, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14608724505711815, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16995623899441217, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15304215878957084, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2337063387889858, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25386102158430046, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4726834738195486, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19930802026738423, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804786645909774, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808543650256, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13206614147090126, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5156199155659886, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2568320030691205, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434189666984393, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10230469917621185, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5736784375245779, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7956580935061436, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6224593317322384, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509127797587542, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397132390871, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18359363036824372, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.538983225542238, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3575675088314307, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4571367072790951, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233681690587646, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35220177359933724, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2583259770790323, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24220564150204987, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030727720501, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2407746038262031, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5583269956903113, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5078118637030034, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33111973836156333, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2450850174649016, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633998470149, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46684562131192964, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7704647900067728, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49804688229316874, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990465829901, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643915204346, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5926665864351015, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6757646139013086, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4707366130650502, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665815940054, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740279064064, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5983121969601184, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3702253820962791, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5602526675768236, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504725213431, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432061340591, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6388352747377511, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31405054722468, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27512971775649364, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974732921865933, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689405736739205, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46879061946652695, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5794004228408522, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3665897370345493, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117165842751672, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23934933660694235, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20561503599839315, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2704802259414377, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12940272769858285, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2323101457820331, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18010665981894972, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12252321431906961, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19072402930753984, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1267851640586233, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08269734287573431, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798744355487107, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16238002530012577, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17441027012509994, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12168575406438469, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510839278432244, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14033624149918192, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32594953050197545, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3849121670073784, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12678517357661578, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1311732199617979, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608724021237468, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6842640166052567, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29259530771094117, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6584175005372521, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525397086385564, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398579728035, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29583986783370925, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4282334071454869, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4016877966455804, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4882834002502252, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834758480781, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41869689220180906, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43014731948069895, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4474602743114581, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943407389507, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754065007153603, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3998116446015195, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24220561357037693, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12852513544989763, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469142492252624, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17895590413436593, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14804718530773125, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1183850985910077, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20946969769526808, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26284184564127855, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.294214963169622, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17895589633946837, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15304215716012445, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14511536534342756, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1329642373628789, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1634454349260164, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40544872030417245, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3486451275895983, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12506538455046665, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.289371712070244, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3023910913803466, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.0742313675927833, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4571367345269548, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11838509631983685, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418435872695, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127955350636, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6132365661928068, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6477982131048975, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.390475842201753, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27982848940358923, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666085075369, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2798285118507511, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26435836896377857, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2674081788091925, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434189383893095, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364244441554453, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5602526819061053, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.594551263650225, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7648916146110392, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567943085928, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.810478897919802, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18832397836514997, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4513265352136198, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14128141924561852, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2173375127328482, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24653334572568159, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5679366243207714, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5851011655089992, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6959583412746045, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061408130205, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093760495042, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09670578670901599, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19682619990606026, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16667540555777122, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19072402730381557, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1422318951540044, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18242553493737748, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25982564762951826, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35220176237067763, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253852501514, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922079216026574, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4263215746814654, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5832033537877693, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2925953145676291, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548519904381, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740106844765, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5851011791184632, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6477982076127755, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7310585529213309, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688192493073, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.743167998382716, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6584175072523261, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5926666083070231, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5964331491256935, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241633542876, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48047869063564425, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6619228707488852, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7813306335721176, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.679178692168737, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105629803302, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733340979722216, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6261241800737132, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.618780442020324, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4726834774685899, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702703184153, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715004471446, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4843800727681256, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2553436492618334, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4980468800556615, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.41489884056635484, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41679665302935104, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6566582627229567, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7786493032159607, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6279512115314089, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015370740707, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175086614943, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6370308126660211, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38306418827265837, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07640767746379946, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276683008673148, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641437494385, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17667161139931073, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5097643694503714, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4785288322372605, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2173375195239957, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13477591218752447, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.361164719124416, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6477982131048975, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47268349424060757, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1980641675971156, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666085075369, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2628418485189759, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4282334043009297, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11201595644809383, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245695864377, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.390475843137409, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6926419855586446, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5525397070288831, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4843800648541743, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878532014924, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239842765513, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3575675355589947, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1375324735432527, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4205996076616903, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18359363169520415, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.394200938650682, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817894146677354, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4111108650381633, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3665897553810254, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076632531740733, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.224055453147712, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9019206800292207, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9224823426531741, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9585377257688986, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9764905469679475, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377687065851, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39793841818355313, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4902356376048684, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40356688251457845, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2043419149182204, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421496488112936, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16238003621773858, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13846178853740593, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26133091455138735, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116676790591, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3433417450592978, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33982762234857966, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6424324688485477, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6039318427296219, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834793567411, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318313446776, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3451052982650967, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5428632644488439, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3593641427141407, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213971932776, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866936865073305, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27825677753836997, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4148988296184205, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.329391731116368, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022542320863944, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2295351981796532, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35756752343060616, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3757064857528576, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20307462320472439, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242353897100328, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633960311804, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08151975520056007, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2628418426604346, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1634454425350516, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1233656096093236, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15713685827030052, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6531269111422352, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37022536770694386, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.674050465492782, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279511974714235, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239988843818, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22135069699932053, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44746031383633494, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5467381250733526, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541661157374845, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974733108221714, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14706452867910053, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18010666172820716, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2465333463005727, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2295352071332431, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1710611827650935, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17781088209436358, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30239109341308895, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19436782628862045, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.214691414526066, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682621603097053, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2509127811670081, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7786492953623261, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6132365389266154, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.486331489316365, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575624300931, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33633103841635464, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3720488050289995, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2720245647045461, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133091844469014, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31069437966243646, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13296423820009162, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14223188856631508, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17441026938780996, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033624870474515, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.11516222585237919, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4416729901883989, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4824291483732586, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5640984699427396, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823337753339047, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046571496538, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3073580134080235, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25386101917689363, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3208213225190268, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253894152028, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076629604774522, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.279828495261844, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22270014773202554, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38676343098709726, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610489954103793, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3738758290108561, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37570647969757, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6039318285663172, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4668455996781299, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567959073351, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47657965429836335, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.049222115830937586, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07159119773893777, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33982762354924867, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.131173232245186, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897355321262, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18594720071829798, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23510838505778212, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2479874410741233, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14511535335947334, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2133771740309577, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6406358635196537, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19806417983414829, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4824291050893019, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416730258221216, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804417560524, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.428233383040659, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5907792197964976, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6315942983386219, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704840400193, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760133364712, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41869693525560464, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8068526341889657, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7356416256549636, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755722103263, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528067642081, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16667539231591577, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.151027797982612, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30569732175664843, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123700086644216, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1755380584978777, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.31742627490397934, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5312093763450007, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.0863234777846393, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544874529482827, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1384617834766942, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1710611899612815, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14903531005735185, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17553807514323383, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091975953365565, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2240554619798461, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4225046526841524, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23792990634105976, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3073580221614414, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815649121312134, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1285251392829477, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7090191259282269, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8233283991074795, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6654105634375427, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633155279566515, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093688356303, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22135068555596352, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2553436455653792, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3775406746505081, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381394326545, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.705785003468628, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3398276399008225, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28140559831885065, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37204879967069976, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1895210848710745, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20181322084610734, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2958398738441112, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16995624317509858, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09534946546825972, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132023408070353, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239108769370543, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14128141919461587, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5097643694503714, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.258325988975434, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2735743912640298, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13477591218752447, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4320633912503245, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5078118680983474, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37204878890325077, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935064532545, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.571766600563806, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29259530579648385, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5448013955429482, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2689414441530028, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1460872471641768, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073580238507634, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20055767171075853, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13939638761799308, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5292633864811941, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15102779574804934, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337718436333242, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5525396895117631, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3684057068246072, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.67060829390232, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22678363644370664, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523454877455, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1037486307732158, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6495786373155855, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21733752148727298, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.144148854301779, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18476751288277019, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.832236646857372, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7446563492024707, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4054487435540121, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205996137571747, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397067755499, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11047114454658703, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2583260117527074, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18952110174491119, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07921031890231843, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052457241526, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39047583002217684, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4016877996483775, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6297746128462843, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47657965823757237, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881375431486, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.359364144224551, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6976089212721382, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5097643848572655, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298812396354256, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947261106686, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17328820066310963, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44167301489952976, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910888340664, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048022575356345, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180444536324, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40168781782883284, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35577488288363746, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3259495230342222, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647177424519, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3398276255676448, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6619228667140749, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4225046260887363, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6169358180531341, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.766293651352082, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331494237622, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11516222866526661, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13660840407244973, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1375324686345031, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.05419873350101736, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07211220100280094, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2323101594619573, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7431679964558321, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2254166056258942, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19072402245556638, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569733088984974, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14414884400226904, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3998116524771099, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16132024136784567, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3647775607988421, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35220180163582504, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15002882077639024, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24944725169718834, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.0953494600922548, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28457601082093653, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16559312120628536, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35577486971694583, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5428632735896384, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3886180245810237, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594720020360792, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.348645151100193, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44939263548049246, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6095241643371593, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6477982245311563, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191529142735, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593551280614, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45132652705261495, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6584174901909587, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40922077878913166, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713671571203235, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324851794663, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5983122027793989, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5486734867014469, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09739040037621297, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953661180482, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048023553946243, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7170118725319077, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7549149808912282, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5621764868310903, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154240063313718, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982068366243, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2814056136271688, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41679663765371133, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36840571036832703, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238405293454, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22270013413972892, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19682622240232917, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28616926188438446, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4436004281202603, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2583259794896141, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608725274159146, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.278256794639928, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2925952706821763, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15203224575983906, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1677633345371021, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18126321629694425, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23792989286949004, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5389832098985218, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3557748798108582, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748893472888, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118622806841, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2254166080091614, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.413003569772298, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1919327864404468, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22953520582344067, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2751297197602459, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6791786902749495, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7341195249432771, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6566582653604369, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834849233434, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3242354032186202, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.27669052534070543, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3684057097814899, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33982762735576977, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2845760047509393, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237091961556, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2598256394630373, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37937840657530036, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6206216112142584, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510838799476494, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191583029096, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2735743783591877, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4320633510955094, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33458943912679173, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476639911865, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559407115546187, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2553436471950203, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3056973355257234, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4035668540952909, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525397028632503, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808690528823, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2553436523783782, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4148988362350589, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1883239905766118, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509127792621496, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13753246596772523, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.753466659265369, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8006919902968284, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6020615744704841, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631712343926, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646904473795, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7074046983959356, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7025300686927755, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7676898671221369, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995897378522, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843800901724575, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5058590795680428, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27202454986069274, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.332852326136691, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47073658725278417, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4551986256606886, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7476159527735675, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7931059324620537, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8479677464378353, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814764076926, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527596935858, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6150878358181225, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5350984137128368, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4416730194592647, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21866938283012274, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07316471751504693, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23934933144094617, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26740815874205737, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39793840241723694, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983121822156495, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092208101888601, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4687906352874274, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3998116619827026, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5679366199388464, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180149081686, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42059959780433964, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17217184755402726, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3157359759403998, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08389038700878464, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309177381319, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31912138737795065, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12168575041987495, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21337717052930838, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1688569508260734, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17441027232371667, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2281565036126287, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.145115358152379, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1216857448411662, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29098085408648605, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076630382413347, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477754314235233, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22815649764402868, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5964331236338525, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.46295862969280765, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804408169191, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435097166455, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8757869982859964, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9469902263951812, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9219218350939539, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9309620711625181, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578533699843, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5097643817321332, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41111086243182277, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.453261864709301, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43014735204946775, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708850569284, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12421300361710312, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4016878023816079, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19314737064627155, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881298374156, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684560954604737, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3023910876313978, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20817893051924383, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5813030810161949, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321739465047, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421301046496151, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2160115386941824, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6909762928759826, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.386763427888815, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14706452307827683, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.531209374555402, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2925952950386125, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43974734824684186, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.28298812650686805, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653334809822466, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3942009296159305, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35398630155184074, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33807712549324614, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3867634504037118, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3793783855587174, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.41489882944612394, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3775406856666643, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2861692497677297, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5409238580852795, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118816792873, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356687282181747, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3140505483746149, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4148988326119894, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11047114661007575, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943865733851, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939172395972555, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8807970797032982, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.83004375530243, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7634837628416776, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389777509793, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392861179667, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5964331477495509, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8056321647340406, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7295197719102915, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634271348318, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38676342183320356, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.331119747883067, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.278256760804085, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18713267426603813, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223189242016965, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07978201691488146, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2018132246183508, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.537041387873039, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3468730917542127, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798745099728586, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808826379177, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2735743862243215, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2942149677919543, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49023562446058705, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473579900435, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117165774876372, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19559408577609694, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7325918308834523, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23792989232398437, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29259532312432096, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45907612772192363, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4571367090936973, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14706452653516597, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1744102795761327, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0987725897701457, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307462473771157, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25683199371476545, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6808786034443387, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.505859127347939, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2766905273359138, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610489799529625, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3775406718783013, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7279754423035021, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4746311880862387, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417440734098, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3259495305644347, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8749346079799056, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6992544010835788, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5058590916398873, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.84389509795698, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8887587898366656, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6513548522621849, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4921881112106236, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4590761374595177, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191313400396, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730146348842, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3738758252505311, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3090237062215349, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38306420429532745, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13753246724440432, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991052035865542, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16026603378680176, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16776334927176628, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.28616923939178734, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3830641566263213, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206337247671417, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37387581931708425, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3191213996155553, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11201595311377965, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3293917166856173, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310499844664, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6224593319845038, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2942149677919543, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7772998556522646, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199079586098, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878462905701, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2814056081689783, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10818894805157339, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.48242911937261207, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756752591024854, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44746030343344884, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26894144685735677, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6774740026843727, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1250653796009568, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516223507577311, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1613202391651762, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39793841097312976, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4824291269468491, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3073580189461456, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011619617896, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463117625114115, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20434190268829666, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2254165984036579, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3363310587521033, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.546738155628679, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473498538968, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19436781821270127, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38121956729989154, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39047585361201426, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995623120935113, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24077459686423242, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4148988297778511, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39420093856519534, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47852882120515483, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.511716605879633, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834777532652, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19072402080757156, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2942149840978165, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1044773208661955, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10230470366751639, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10743747270502028, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4726834562339734, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4455295511626717, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36116471313357873, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241858041955, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421300766484161, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5964331388145608, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32252598108713687, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45907614013809833, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755879979348597, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49218813675711887, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2751297351085495, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3090237078521908, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022538349853296, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689495881084, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21601153942235063, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5717666003507688, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2613309314906555, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38121956107564453, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16995623369171606, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19682621254992264, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2925953037861333, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21469141682260692, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073941700662, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.132066153296138, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33111973008236156, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3398276303451466, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.307358008836285, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29098086524504874, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2494472413456929, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5888891311603817, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8019358241336038, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8278281491501582, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.869714572691604, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872131816307, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39793842638062915, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5253688195858105, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.509764370832827, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702638128334, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641950585603, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16132023184641017, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11201595616265093, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15921740872762297, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1699562377809424, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559408111034504, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6039318462882995, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.588889141810904, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6619228651864678, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736783899901206, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736783936384277, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6909762999053506, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5428632641128316, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6688802666260709, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.607663166080978, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.812867323766733, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35756753132834895, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2393493373973177, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3328523227566768, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746030761960354, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44746029346237726, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.409220792066886, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42823339931905463, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10894504326979279, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.171061170719385, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000709625940554, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1710611816812096, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40922080474689554, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11201596043421941, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.30239108991581354, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32766830728665497, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2720245716760846, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1008786176490278, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09009299376770377, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2005576844032512, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242552867925269, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4359015103503194, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5175709063222075, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6388352622326886, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3040416700312756, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.533154394155203, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13206615080821998, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019531261728215, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07159120615165347, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1871326918559907, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35577487430310906, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3242354091568777, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3867634515955457, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4130035841791844, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553806274000994, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.511716581249874, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2267836195702256, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33633105816133574, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6791786896764396, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1311732171243156, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3575675266861559, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.47463118425497375, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3665897484040465, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.618780440730308, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125642500243, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740070907947, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40922078715360966, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5698526427705888, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45713674065192894, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881258700767, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256491545958, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.348645143706986, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1581743641682207, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3775406831786852, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259849343577, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307462433258344, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2479874430259894, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4980468791360794, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3415824975776351, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526565087356, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594952320406867, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2337063332075362, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27669052961229035, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.235108382105899, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4167966449236713, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017767773747, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33111973604672024, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25982564762951826, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45519860278109836, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31405055937069026, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922079216026574, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6825737281076895, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8955226801222016, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.656658266941002, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737875058172, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145802806019, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3849121516913919, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3757064791260975, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41869692640099737, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241918848458, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526542031487, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21733752153938468, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3960681505454708, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45907613902240724, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25091279814658224, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398763645776, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5370413844311402, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2643583571234267, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6460136921375171, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3793783917843056, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28298813375722914, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3923368352622898, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5660185280942298, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4746312052968906, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27512972183515766, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29910520437322324, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19930800450528174, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12252321679565815, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23934933325708527, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076629436098795, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667160612077581, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11047114983288195, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.07159119773893777, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1907240148145212, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12002563124893834, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897355321262, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.33633102978035906, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3191214088392427, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2323101416348998, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46295860203431716, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16026603446823356, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5175708812473043, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38306418610547427, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5813030941044537, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1919327944218295, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127822780475, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.045352580216526335, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.08389038954715419, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18713267878331075, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943710252471, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1955940711977099, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5097643838811526, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.654894714975444, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.710628311188738, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647248077792, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23792989829278682, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5813030977396427, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2814056118520705, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39420096247471714, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052598568934, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.466845594593988, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5253688261573859, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3647775592012162, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5926665905689451, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1550784778623191, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234863492848, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08329192788576363, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17328820036520473, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08945460909764757, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594720336023166, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19314736427701548, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5583269764337537, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5525396989106478, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.542863291702653, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117165886703956, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2704802297576065, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11838510240108308, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12940272601290492, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16776335316998464, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0775176565802341, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10302442991234177, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5273165358051979, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6352224454803576, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24077458683366934, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806416643126107, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013930409806, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.704160130243434, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6424324688936625, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.707404690960245, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526298476925, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943940714157, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2643583661134976, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18010665784803317, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18010666022034047, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17781087825875946, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10521053747636117, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3123700095733017, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4054487377453132, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36477757594590693, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31742628114359495, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015263100839, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2583259816637115, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2613309270709673, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.31069439617533723, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621764941094516, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26894144121205865, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20055769270573334, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2720245562516665, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14318770899090105, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1721718556318216, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07159120259736224, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.677474013254262, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8397339666382233, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33458942919286244, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468490182832, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406556977131, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2925953094934372, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.46684558750602917, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49023564007903514, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43206337527609584, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2877678110853689, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7325918241132637, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8080672074063346, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6334102681563023, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804685613911287, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837626011234, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6001883305479222, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9073122230593551, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7490872060661641, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511439713736, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907242524551, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21733750771626698, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2735744022284209, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2689414410894338, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11047115021387087, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3276682986154672, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3923368290971917, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4359015058649471, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5583269896993664, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315117297679, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804691117765554, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43782348717463504, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38491215428583747, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6688802608025813, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3007455858546096, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35042137709516546, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5813030648693249, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25982566045645056, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29746994376263747, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241688364793, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531146384819, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7154240069812237, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5214711424795382, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6706082848922876, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740309691587, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512659537494, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7745833948931538, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.667147660496682, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7943849531456216, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118647811983, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928976960547, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6495786107783831, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5888891368348157, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5117166244241708, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476766896589, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.777299850324747, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22678362157458287, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40922080474689554, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.0967057870468357, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405545626098258, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26894143332546666, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5755880061473598, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24077459884130734, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5851011621877482, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.531209373433262, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964141691478, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16776335378881027, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3380771381187198, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3557748816945949, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651622914716852, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28457601752702716, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6334102552460111, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5869964260452779, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6654105645683135, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316998618204, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576172770781, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6020615833495284, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.633410255550441, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6001883393276857, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306280051246, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228662395839, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37204878670312347, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5813030610035912, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910910020317, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42441199224842757, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594952767297497, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12168575399982035, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13206615432681007, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.04304284689689564, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14903530880904922, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12002562992307866, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2030746188214147, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44939264972506704, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6548947163306944, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984288363989, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494462116889, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23934935164681334, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20561504421400714, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3276683016538108, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17441027697269704, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1530421551531292, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3242353965670774, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37204879123486095, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1530421532858906, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27202455328188613, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14128142379773603, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46295862029933477, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6859494488190859, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7943849596910527, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926517321801, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918205308531, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17106118161965728, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6477982157978674, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2379299012997609, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434190056936874, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1540575572919973, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7446563536501093, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33982762997879656, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2845760058328853, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324714197174, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106282989918343, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2107662891378537, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18476751661247554, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5409238501332485, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798742895933445, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594719791737577, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2081789314346052, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5370413869053587, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23934933615916137, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17781087661411338, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953521115113817, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3007455824800167, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2309197451006908, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08449275348891505, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594721182310808, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237041323036, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3363310511376193, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5467381406401295, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39420094684810236, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149973823588, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358243922717, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7138307731696106, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20561504993292098, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2465333348634848, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526425682352, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32082131461083746, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36296918586575955, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4130035807416188, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19072401020122892, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798743814732918, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937839016127545, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6876299887227518, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4513265214639666, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5506073692077139, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.866132507196427, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701053850427, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.15507847944901365, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8267117929578482, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25386101591767934, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.287767813744843, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27669052525266946, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3293917407281919, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2613309397234278, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41111086196103835, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2068940483085315, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2877678070625483, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12765261681317316, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.0994702056253313, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1859472071734193, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12085322822125025, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118512223783, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12678517388388424, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27825679759233446, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12168575636083771, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1159607051980397, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13386749311732177, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9834704429613285, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9929882044380557, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9824231154279243, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.988580385327574, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9603611601314139, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9458012670421844, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9757623653359097, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9257686322360482, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9603611616599866, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9693242010644978, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4186969344289219, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41300357554122047, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27982851070857173, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1847675016128759, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364246771452558, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13568953101387457, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24220560567052135, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1023047173665278, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0967057878136918, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1655931073731354, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25982563711444745, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7201715017280983, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15203224626533265, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002882432614287, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894333621758, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20434190341426534, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6334102360024065, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.583203371971383, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907613082088444, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29583988787003923, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7008947771644403, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.675764613082392, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7074046925899495, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300469951367, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307449209863, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22815650592095799, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20817893768856996, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14223188912344925, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.203074624732717, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15921740954081048, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25683199489776565, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5602526710867248, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26588046367367296, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405755899703713, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244120055587179, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2845760036292101, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1112412157486175, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22541661409180613, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3486451480659478, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436522844927, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8519527958219199, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9202179923700511, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6619228634147355, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435185458258, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675308760006, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1666754053995983, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.392336837758286, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1403362445741502, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14903529946182742, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4902356078267121, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10017222219753542, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1732882070524876, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.0826973393369618, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1602660365142854, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09268777860771672, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46101679988338473, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30735802390093947, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4513265214971381, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.468790634665679, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39981163874134307, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36658974543465794, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7879311963097064, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7866228389543479, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3793784073546344, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397071387279, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12168575701653747, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18010666589906388, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24944723723677006, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1276526251434384, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09739040218773881, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3157359837618292, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28616926355586597, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26894144205988335, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653334868486737, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304214861971685, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5117166044018134, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.567936600783198, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5350984464649812, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687307624383235, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17781087302457044, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.379378391190393, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2782567866227968, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6001883724611514, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34510527880155845, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292634108231986, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5486735098529993, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3293917297057757, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6688802606120217, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32594951867855, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352903752583, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45519860873712914, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6671476666443432, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6001883554400438, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358248343473, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814538886359, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4610167980140733, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6671476666443432, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2704802175228652, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204878862419555, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.567936623239058, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2643583715042711, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4225046093512108, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5078118659741204, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18359363003698695, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304215240043245, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21206881350620368, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6187804566590853, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13568954597305247, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509127850355369, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468996060073, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5467381563737485, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7879311963097064, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3363310557138611, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315249254946, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723632915539, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18952109340025183, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3040416788149615, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27982850468477566, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792172987294, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368416542728, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4649015820802635, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9704646633496928, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8322366582306807, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307302673578, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792099275783, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8233283807244157, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8824278763186488, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7799929008521831, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898370006054, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185817649143, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30074558549205577, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3242354043920728, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3363310878791119, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2422056248219904, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24077458148555378, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2909808674193399, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.392336837758286, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3793783977944001, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28776782048965477, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4902356078267121, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5312093703317067, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36296919399840394, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4824291095108379, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.523420350885231, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204877589644236, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4902356269309391, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29583986696343695, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20689406491022233, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746029284799854, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610489318483683, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39606818726922904, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5214711728644729, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26740814425968534, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3504213706471617, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064898160731, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28776781255793704, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6671476652639025, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5350984253451552, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941408950066563, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632729743914, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4532618315354602, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1530421452222814, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3415824788271928, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634600070093, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19314738702265946, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817893534823903, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3208212986979201, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18010666802969044, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418597709587, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616923590646864, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3345894410974474, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29583988213324464, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2598256438148453, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051993627766, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808691909557, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.646013714506558, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7866227985713211, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5156199211722825, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802335469025, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956580993408211, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2991052002921508, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4804786874680279, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30074560157614877, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12940273110794467, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523401586603, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23651623634331256, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4765796818697888, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4016878000803456, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2814056100578624, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15102779973665495, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36840570042730614, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3123700033812286, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.325949533342453, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814610737947, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.401687798692606, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5058591056815646, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8311430382735299, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6992544153145215, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011741866301, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929029614712, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36658973993298205, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31405055792498277, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.685949454010716, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116543683395, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36296918191368577, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29746994344126904, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2925953111065703, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2782568067402475, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31912139688377794, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937841118620075, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7090191375216255, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.422504627245868, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7217432430284663, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942974367809, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688179571869, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11920291606875047, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15102781361379616, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09334687953658921, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11920291890888317, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825680518054957, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.48633149656820257, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6531269074304532, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5945512841908079, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988473070675, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.515619921667919, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40356683763109724, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6636689561062245, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38861800175369027, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015764807478, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631540233642, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39233683165365263, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15817435730601906, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3886180275120737, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771360878743, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633152383276135, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7563575403931315, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8652240840594038, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.779992898515658, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046862186458, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278627206701, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17667160350837122, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4687906239263859, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10669059991512267, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937169907333615, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.057918086187332046, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36840571340110134, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7416740168024785, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3738758135487487, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4148988355875336, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4016878121872376, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42441198971506167, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4765796398010469, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29910518816812265, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.28298813118802085, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.41679663866140554, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47852881994834534, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1451153645597592, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28776781473305074, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3998116594522862, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09467770621534449, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14318770813655005, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18832398382077065, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1530421618150562, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.08632347578187838, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5428632927349812, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5602526466433793, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3007455864792718, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583270073228284, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.65135485753916, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16885695634006095, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23091974907660573, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33982761900805275, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22000710433464352, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34158251269092665, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2925952850641728, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24944724366557192, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2613309318218689, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508500695387242, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733750659640863, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5983121972982837, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44360043199690485, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6909763009691409, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526632782162, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563511943762, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49609382612777786, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33982763205638306, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4359015401124734, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930800904882945, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367334583517, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2845760009081811, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24077460277911092, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2925953154881887, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1008786204867526, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682620892575275, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39793840254442914, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10447731962033212, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14128141355309923, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.024798161562208397, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13296425138056062, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20817893894977077, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4092207763493744, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38121955522248446, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3904758554201955, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832227854917, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8799743656083547, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5136684713329717, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6601723820335581, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737884731327, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367951206765, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1347759187040591, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11838510508274058, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10818895139880681, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559406907935672, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10302443492773178, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18126320938308577, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3023910947758851, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3415825010252682, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31237001354867766, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269905278556, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8187367893315256, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8783142447298949, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.782662483475502, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849569068645, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789063508333, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4035668589870899, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5292633988051273, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3468730800721054, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806418969085615, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995816896755, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4902356193177672, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6334102547551425, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7759445316783806, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321828675943, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430543837752, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7905303011528145, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4035668736986194, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7476159508826263, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.40356687022142573, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300483309006, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.622459334041105, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6261241758506553, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7839884696856563, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269776550142, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494497811539, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2295352049178996, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1059482858350099, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11838510396329231, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594720878923207, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10669059029175335, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07531230499511393, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20817893874574186, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40922079371554104, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2583259774236843, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4035668729416707, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.329391728604655, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4824291244949363, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6169358282252965, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47657967493061953, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740235270191, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3738758150209502, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2658804640460054, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25832597795450857, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1721718452720213, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331365275664, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10158944682463654, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33633105533913454, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12421300770382598, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13477591282553608, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091976403299808, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36116470698688136, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48242909889855895, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5467381354928105, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610277213386, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519860286452735, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16667539781741303, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4301473529356274, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4282333888864543, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220178563186094, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9385759621000842, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26740816405223383, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.49414090505879116, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.361164722903621, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814587198407, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365660450403, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2583259910549606, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6477982157978674, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12085323365935766, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12252321602464093, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939263483005554, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11279539419808614, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19436781699847133, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1824255403624729, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2267836201818291, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17217185404671903, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3225259886384656, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3575675222654597, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42250463917321823, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259885117071, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852885311395366, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30074558967552184, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3040416910360669, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26284184609345007, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667161422023533, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15203224659615186, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4455295701954023, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24798744516220686, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1431877038883054, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08756384768345445, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16776334400677098, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2720245686989843, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13296423659682574, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23510839000719416, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567966784942, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1835936269468566, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22405545838465346, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2909808882626988, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4378234910684842, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1699562368813938, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519860501381293, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.205615033280015, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3293917179261819, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2240554531606252, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765261829510685, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.189521104653665, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11757213848131777, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.05582314215786914, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07978201890906686, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09203285943452863, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.08035746938330822, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2407746071198076, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29421497003146635, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3276682996476735, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2107663051963761, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573597679048987, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3849121724516902, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30735802390093947, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.32423539588083977, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35577488646433464, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3812195779538631, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45519861024994634, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3738758142098963, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26740816582043636, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653334356319936, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203331168045, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40922079936765016, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.38121956604142976, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6442251256995978, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238403539630816, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3812195389430618, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6206216037040541, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6057990158031583, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7356416226028014, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217431810724187, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228717851563, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5544704662360432, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21866938774328787, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2751297268076011, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241740211126, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897500462879, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29583986998792794, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.15304216010783733, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14804718573343384, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2379298737268942, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2436424574852702, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3539862929763176, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.484380090456646, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5331543928429784, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309224386111, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367103943777, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.05623634163415358, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31237001327092623, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22000710813595165, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238002465901866, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1634454330084946, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.11279540620071106, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12085323370122966, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15610490678445113, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11436851916413152, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220562975148674, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45519860321815053, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019530962551207, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3539862921627673, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643844742323, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311867023171, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22953521879391853, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13477591740440412, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.10594828625347237, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713674466734433, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307463270553855, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21733751697240222, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27512972435672745, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4416730132398759, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405546114949015, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416844085305, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19559408531643768, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17667160714876728, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.383064188859472, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06656918690711974, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.25238404882024695, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2267836553438311, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5234203412102512, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5851011396124406, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18476751441781356, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966442065954, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8723473833790278, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6859494460600696, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6740504583835532, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601136521484, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665890237094, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35936413396040257, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3380771429842281, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4073334060434735, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.432063400134344, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33285234334990144, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.75055276968227, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4629585957217483, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3276682909337919, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802789247571, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367154116556, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39793842496250714, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10374862871281446, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20561504065678693, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1200256321612559, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331543847448672, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.19806417722489472, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1801066705432026, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25534368065506247, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601153065523068, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10158944363942549, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22000710426626832, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21076630113169736, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2509127911251463, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21866938475139672, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881292396276, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.43590154378586976, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5506073415398773, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7264256141681981, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601283694765, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.649578633134912, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8031737874396455, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7520125667190358, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6113819762007267, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834619364374, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118570894547, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.39606818765863827, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20055768437749813, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25534364484911903, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926403808059, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742628613667184, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3468730753726313, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33285232978975815, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.26894144211442744, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3720487905888033, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681102439179, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7534666502149846, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4610167910381477, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5660185402118277, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819829848898, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318219268802, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21601153521522418, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019530962551207, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.21206879954940422, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643844742323, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311867023171, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16451645046232422, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32939171740761797, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4960938455351328, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357958690216877, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866938280623524, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5409238946227797, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4785288389613415, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47073661793209065, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786250630323, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828338750928574, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3960681604508836, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1571368517410344, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23091975940114565, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.31405054916571, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167297613375495, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07531230877409185, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1451153597859632, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09534946223396269, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15304215826673345, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072402543073194, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4320633876590803, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2861692515323343, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5907791979327401, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44939263390252077, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1859472010706816, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3904758381537146, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2782567934590284, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.45713673989890247, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.607663148282258, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804685512899, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3276682974673403, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2861692742590837, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5078118802967112, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2674081578661569, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206880168840286, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28298812143906543, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18832398705244432, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15507847455368193, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24944722239914355, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.174410276954346, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28616925777702096, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3007455851561358, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4921881502411732, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033625348304363, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804710374481, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.47073659781118943, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.48828341351523336, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38861802089725306, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2814055900885198, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3140505311319482, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10447732599281312, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17328820068530562, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12506538461274788, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583987572851217, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262793415555, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2674081572651209, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17217185393011666, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16132024174817802, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921740387717376, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242552710626356, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35756751393919267, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.747615942826373, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6020615778131259, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883514386855, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743611918948, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21206880701770003, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7106282987474317, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8864204120573592, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033671283395, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578370448123, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6334102635960108, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8418256489831974, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7490872101703757, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832261054162, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.879146768544209, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4320633786601182, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8895288479123309, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3293917152345231, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2523840386973027, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1510278025855653, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5273165256662216, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3720487924687223, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43014736417630545, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.29746994348504774, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593372262319, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.602061572898427, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5486734757549739, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.694302675856837, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531268919691797, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228825974957, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5234203424675449, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5117166046500385, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4016877984126581, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737169785379, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.44746029849799485, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14033624896174954, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17553806684224046, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.08210663266812931, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2173375171761447, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519858811323083, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.533154398890051, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3942009462232628, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7217432004142753, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819734541452, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.544801390596023, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2766905181303985, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6334102579509526, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910862032496, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23231015256713916, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708667203345, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.06560483444561963, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.08882028786160935, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15610490771794566, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0780781599227026, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0623310373751968, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3960681836801333, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43590151641032815, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5409238588839665, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064793646829, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.422504643764342, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3328523379740817, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3073580127278277, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.27357439198385197, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815650270158505, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682620814621765, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1393963827808988, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1931473770775142, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11436852446129986, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26435835901970667, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.26894140209068895, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21337717759821667, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19072402223249654, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1955940715908975, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.09073548751612291, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22815650186394051, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3793784085053963, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3504213735802313, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2909808729726766, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469142198452795, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39793842183206385, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.47073661471982275, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.44360044154543493, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5058591218709072, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051818520459, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646110630008, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35220177712812933, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45713671183157717, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2958398789127999, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782351653015256, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.592666584966968, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5273165171621419, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4902356210858517, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41300359271271797, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.552539700075001, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49609380702656497, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6808786161860307, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9219218347817758, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7356416274979134, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.44939265756971764, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430377261219, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5506073602766587, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3090236985682927, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6424324807242238, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27982849359385226, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784221745289, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.531209348897572, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5602526678037301, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25982563741258835, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2974699767037494, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946968670502034, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18359362457801456, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3380771399466718, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2877678098304525, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213846415229, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756752892717103, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2782567950735572, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3380771384921872, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42823340956690537, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864514364536126, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647153524749, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7879311986127516, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6315942893351841, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.713830747826945, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4513265183897176, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633153052098366, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2227001448051861, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20055767227030977, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.24077459545151686, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14608724954138197, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1581743562228001, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3539863011007189, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4726834534405722, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.46101678374438776, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504801741038, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508502214774622, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5794003991209333, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8661325110165057, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.817574470133175, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.605799058455518, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702757756453, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.45519861276900037, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.23651622734302577, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5312094089338325, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819852134246, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808702251496, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1480471862385998, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20817892787829806, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25832599516810045, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256274395564, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1931473746301171, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.40922079502479924, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.564098469051327, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3904758229379615, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746280902695, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4902356397266306, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08329192588732748, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.177810871525866, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1847675104837394, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651622611689277, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167735781877, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2991051959920641, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2814056090537393, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.04672496007786048, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009420138795, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19193279116890666, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6424324820684075, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6926419852374411, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.859663747384963, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982122290353, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245933664777, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18359362998432244, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30902371082645, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2613309288402975, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.35577487291487225, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.14033623737702194, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.24077460283592883, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27512972432158656, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5813030772833528, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093831751675, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307463036050338, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18010667052922155, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1159607143856281, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25683200713470145, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32594952517674397, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733751349858263, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3225260009822405, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.41869692902486405, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2845760130918549, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2379298984691166, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594720743408344, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8116760107562678, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8732148340962042, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9591542817626039, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.937668962110032, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.954307969789756, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.28298812143906543, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18832398705244432, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.0857092773560202, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20307462918094243, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.13753247694952783, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22678363887611688, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6424324966682974, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18952109582967572, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804786897267091, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413591448897, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.704160129154421, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.861538215874729, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7606506528623169, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159663000622, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381453632008, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1259227675145933, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10087862030629424, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20434189337646125, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1460872511444215, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239109147869286, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1561048984117107, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16776334217712932, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.43206339847517233, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076629610169834, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711593725464, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4054487258352045, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.39793841834201393, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2689414549202966, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252599417859806, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.29746994345039196, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2925953164573121, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29583987555567953, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5156199061397756, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737264296828, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632866331176, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30569733414444933, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3611647078304654, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2829881116653316, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26894143439996154, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825679464020897, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17667159885202025, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22541661836810592, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09534946360041593, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08035746525702865, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1460872532374471, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23651623907550223, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20689405575710793, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19682621508895973, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12085323260195398, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370635333315262, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6495786455453476, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.519521311723938, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2782568097512285, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07004896259698679, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1259227677405836, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1120159529919256, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18594720080824753, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17781086726836928, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798284995514576, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651622820117427, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07921032207601522, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.33982763039433866, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19682620540184836, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12592276705521321, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3225259973369765, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4282333996159694, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18713268308078437, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1955940733029542, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2942149651298241, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238003735623208, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5945512745410442, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8044059095957544, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3904758405123758, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582531760237, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118760364885, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44552953100438974, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20181323255821285, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.051845465311314655, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309177243628, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239109301738537, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.60579906664111, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9066531185190853, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4205995859507043, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942830743887, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680055241158, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6297746057737539, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2720245733448685, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4571367361033532, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585483306556, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4244119917360062, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7620700867598711, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.42250461786193283, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935217214155, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046812859163, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.03594832422255272, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1451153597859632, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13939637966052615, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.08632347616164077, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610490278303066, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4416730163599132, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3867634385428604, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18594720368829992, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632157759680633, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631663173946, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6495786270310183, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5660185366957751, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15610490934294097, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102553449488, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.49414088975833437, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3867634468554783, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40733336287094973, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2814055939886643, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647034804802, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121957721566463, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1015894533707163, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.09877258691658294, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910874109212, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.04778006865985976, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.10970577213011334, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7401743751488719, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6057990199770956, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4378234852455387, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2925952884304673, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.560252645440839, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4785288648243994, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4629586127902157, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11676400756704305, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331314509022, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073444297596, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.36116473491528567, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.12592276866159557, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18126320771023535, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091974825671482, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16132023470210843, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16238002574245566, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22270014369547522, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14804718843122625, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276683069769478, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4073334151797592, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2909808680995419, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3056973211329595, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.39606817357892815, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32423539005588853, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167906454262, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.250912790432171, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5525397004353455, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22135068881706016, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.26284185613768707, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3208213051261356, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.047780066698592596, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20817892488765058, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11838509314273157, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318273518205, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463117617137485, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.12085323221263591, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.22953520294936644, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.29583986673112994, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306416417047884, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1602660402368086, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37022538687974205, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3345894431434738, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.14128141651567577, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.273574394563712, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331369160155, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10374863528078888, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.11201595481615596, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.1732882031819768, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2186693838192778, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364245996209677, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34687307427118075, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2523840552457982, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35220177841524397, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883476384292, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2751297256112122, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.26894143510772395, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.19682621074850404, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5097643868028154, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064723103443, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3225259708761413, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3904758262887601, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28298812912592436, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2583259743385797, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406617115713, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3106943912517617, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3023910888761481, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3665897285619251, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13660839543871073, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39420094397075045, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30404169276210097, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09602549727521711, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4513265118248427, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.20817893411479416, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16451645869751014, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1755380611824914, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2751297241986361, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.21733752074330023, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.13117322217623675, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823338833444136, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658973984296667, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3276682993104249, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28616924568474617, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23510838848316148, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2337063409452209, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.1451153598836098, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.10158945016548136, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.171061178627201, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.02887090760501849, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077461042891057, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253687948474767, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37570648637809967, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6723317078855526, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6242935577534496, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894433559778, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743612069613, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09947020921939306, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10894504100880288, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.12168575908876697, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1302854308600212, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.09534945983081859, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3023910972959222, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5389832076366808, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8757869973393665, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784214099202, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633750505981, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2877678204510592, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5583269776001857, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36296919091568636, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907614123730384, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2925953113397236, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20434190306844113, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1931473770775142, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.36296922147083904, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1267851738229877, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.37387581011026, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7592253914020802, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5019531008272707, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5292633890101247, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268349673334514, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4455295343388757, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3575675252842235, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6169358536241957, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5136684756162387, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2393493438975991, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666174434871, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07807816249716046, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7786493132072992, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2133771758813402, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12678516155955505, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458943724671647, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5964331332704511, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45907613204258313, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23651623695889115, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023561251315256, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708827916149, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21337716904684847, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.37754066861847774, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6279512018516054, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009514650417, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398147914040575, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23231014026039165, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18242553277576273, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2160115361648825, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434191066106, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39047584768461135, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7759445338924293, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.14414886123713028, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8386797672329286, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.61878043338118, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569731653326787, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20181322268284477, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3090237011105609, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19072401581721055, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1393963886808651, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939171235052317, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.06512754817481987, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6169358536241957, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40168780561658524, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658973460033595, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619289016091, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.25683200367508635, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3812195771028119, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4397473590200329, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4882833846698681, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594721224826224, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17553807465610557, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3702254049333069, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4843800824490942, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405754801032454, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420095923263754, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.46879059593719385, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5851011324523756, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5583270050180988, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512590523203, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268347485971424, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3793784026034146, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20307462451588063, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19806417817783598, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.373875818016633, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2213506925060876, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34687308218503704, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3522017769578094, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7122321904858241, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676342392089885, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.759225407472581, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21337717193808228, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20946969852488576, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.46101678815873887, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12506538728855635, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18713268196608204, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.16344543226380567, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5195213246293092, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23651623632388502, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165312640465, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.492188144276797, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4785288270287414, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8879840448533438, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5389832013419593, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922078707595444, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437614596132, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3593641389312223, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4980468765456806, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3904758312745535, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.348645140847879, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665930311487, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5888891513464298, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.24944723138851502, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2958398631877376, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242353942751351, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2925953184402347, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23934933690734958, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3293917140997672, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16132024716151894, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679661717078803, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07316472373209282, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5888891285995353, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.06656918966520249, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.47657965356605614, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033625309473038, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12002563442999746, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.07751766308994563, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10521054460923832, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.16238003048928476, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128140788812754, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.17553806961386095, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22000710447051755, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4455295474617793, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.41869691837778883, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245588382809, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832123484716, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.523420355384991, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5389831991130848, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6791786934718738, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743415849532, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681706066721, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6279512167227714, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3293917179714657, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9039745064698314, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578388178995, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.713830740255472, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1490353076893378, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.36658974948813167, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3522017846330625, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.28457600188060855, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678361736766373, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34158250699761183, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31237000393532144, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.503906169242512, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619440349475, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631563890835, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.20181321436181598, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1052105307981583, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25386099519579813, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806417594020265, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720487786263703, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18952110351913856, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6531269241886686, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.18476751789687115, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.07807815960034421, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2018132199078233, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.38306420041516737, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.43974732835446806, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2720245667023162, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952109479842028, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064826506748, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.32939170443403715, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3757064627083445, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2814055933579276, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252596760137503, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270011189587, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3647775701925191, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5467381586374779, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6654105589320659, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117999362539, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918428484481, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3629691891481823, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.20434190194641355, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2674081609102495, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048022419146445, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238003306927903, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3191213859403731, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6169358487412087, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3328523402657796, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.70089481940184, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121924257461, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6406358554955605, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.31405054722468, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.28776780051846385, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2674081696223769, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689405736739205, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.1451153563608428, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28140561799207237, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3007455780398716, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337717840054735, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337716268867044, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.37754066170745837, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.26894145230121186, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7057850319775281, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002881984103836, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.35577487325238116, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29421496699196426, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5350984117004386, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3979384212907754, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522017767498443, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18952109482081828, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13117322220237504, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.1311732165077992, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07531230507164206, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203224428946024, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.0980793212210091, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2735743993939431, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.210766302439643, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23934934755964843, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.12678517273718176, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076630042168998, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2379298876553369, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.46295862635734536, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23091975128942013, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.13386748345444274, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3311197420690847, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44167300717443003, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9582261180659236, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8577681084757321, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473774528121, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277744037131, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22678363410275099, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4707366082893448, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.40922079936638783, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315532221885, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569730895553765, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.094677708410163, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4320633816520848, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11676401412753087, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14414884841575115, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238003281385135, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34158249760631093, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4590761407119771, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23934933213329984, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14318771794249505, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3380771337240241, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.08570927366720951, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3276682986123106, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.04707417928449974, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2553436387910023, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398146947245547, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4843801054830065, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4225046414917185, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2845760172181393, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051777882945, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2735743924070339, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22541662386699038, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5621764899612708, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22815650628665532, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641549711123, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.31069438876466454, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30239108422737754, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3415824907026145, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3023910763006377, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808806881962, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358288094389, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4416730230499745, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5506073400757326, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34334175533393374, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4282333862168667, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365590716689, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18359363260015518, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.16238002395489484, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2407745900034896, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238003131306608, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733341087905806, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.0832919242704918, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3415824894301658, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.11676401397114554, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.05582313814716004, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.07055959636906514, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4590761439514445, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3174262785593555, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.49023563099583806, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073580203375096, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708896590616, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.22405545993065767, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3311197508134524, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5175708776381782, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18242551687258624, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076631567061227, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.34158249757489756, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4205995615580538, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.15610489859700227, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469142475427272, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406805325193, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8376199717130972, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.47463117395427085, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6706082891561008, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.646013682823884, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.588889141975794, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3073580185870858, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.64063587187805, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6723316821865741, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.22678364442022658, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688249866885, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.49804687478807824, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5679366095067959, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5350984241539528, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689521764308, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.42823339909111197, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5832033486977368, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.6495785888497247, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5774953429762658, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.51171659565436, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165167614835, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5253687950480536, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5679365959802187, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.7718434915391138, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610049936841, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102521613197, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6442251168783752, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3242353849200846, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6477982203507325, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463119369187995, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578477714756, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.44360042479710243, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3522017750943882, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4378234995405856, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16451644490814188, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242552362662814, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.18594721119624757, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.28140560198162273, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07423136964865813, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.06278920654593236, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12765262344109576, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.3073580257542765, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3276682981029174, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.17328819716064187, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2094696963324007, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748731197643, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.09203286046641661, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.35398629732920633, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.043042850028755957, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.0994702131332389, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12506537885628052, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9473810442021362, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9575961719836584, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9257686322644206, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9511422173453828, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9695556492580248, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4532618744073335, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5428632645314471, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6187804267156339, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.757794362594929, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148238748632, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17441027700905737, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3380771463760054, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.34687308755772395, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902356190380038, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2893716958192038, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5794004136826134, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.30902369833118987, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6076631821375182, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216026432145, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984873870727, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.14608724796568973, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3380771379259138, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2958398791287995, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776334000112753, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.12592276786846635, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.29583988070759465, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.18476750020126842, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2991052027082614, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798743665045206, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2407746002165588, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.8376199700846322, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7690802507035164, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8652240796754866, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.935346510200234, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382104537961, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.594551256822251, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.8832359922593191, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.8991213792763312, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548590738919, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9149009564129214, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13296425006592175, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.13386748640751578, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.07864237780161483, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610489717352544, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.127652620371985, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4843800800049317, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4359015081489512, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.38491213598265756, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3720487808614205, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491215512787474, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6224593405087467, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.45326185130276775, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5832033510181872, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185240603673, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702630138044, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4130035953623171, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5039061560240986, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.22678364122025646, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4167966689538438, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641820941493, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13568954676492434, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.27669053207044453, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.3486451162212605, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46295859004959444, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233682430010164, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.23091976125981306, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2120688101998338, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.09807932380469217, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2030746199008243, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.282988123565818, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13028542352180544, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.29421496663225377, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.37387582086486965, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357958431318788, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2523840468317349, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.13846179074858725, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5544704499002893, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.25386102653927456, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10970577175132018, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2018132236655059, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5273165247337442, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.7718434915594796, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4882833698858075, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737921621478, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416267485172, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.7008948102115948, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3293917144278715, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30074560114526006, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952109984721166, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786946374233, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.35577487825277243, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.42441200273592294, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.426321592593874, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180047671093, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491215842356846, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5428632684241034, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9099070060963955, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.922482345131233, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.799442314008191, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942064008364, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4436004209008843, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.40168780617544414, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5058591343000698, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101677169318367, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880108234607, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.445529532259491, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.654894714975444, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4186969333741876, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1721718420624259, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864514098968497, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2200070932504986, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4205995911338502, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.677474010178561, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331543828897705, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2735743973858915, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.21206880758983446, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.5544704499002893, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.23510837272397703, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.10970577938395369, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.2942149738697663, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5273165132795661, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.4707366022621347, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2094696963631928, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033624788101356, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964376936138, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17553805712494583, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.2465333388912987, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2674081633700045, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.33285233781974516, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220563554581437, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.4765796565524769, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3522017617292119, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5832033551645752, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.23231014917098763, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356688315142886, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.2309197600279927, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.25832597347010233, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.30074558850164673, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1074374708535645, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3225259986524008, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.6039318272905662, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3293917227656929, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.5945512776567842, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.36296919306994957, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734995597995, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5717666176858206, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.399811633787043, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.6566582831231269, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.39420096665028553, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121953902632194, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5097643842268536, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.32423539454281464, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.33458944723051565, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.4513265142332926, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618695789167, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5350984098313877, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.3647775556705896, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.4882834103952426, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116647472522, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586026050301, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.30074558118117956, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.332852330469319, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.19682620533496709, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.2281564978097784, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730781923144, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.17441028103677805, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.17441027926068844, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.35398629034521334, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.1460872503604958, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852882728299784, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.5621765146849945, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.10894504320351538, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.2861692588178182, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798743710190943, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559408085827096, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_length_ft_llama", "target_model": "llama", "recognition_score": 0.9653811621289118, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_length_ft_llama", "target_model": "human", "recognition_score": 0.9637799415120681, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_length_ft_llama", "target_model": "claude", "recognition_score": 0.9553191297617944, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_length_ft_llama", "target_model": "gpt4", "recognition_score": 0.9582261206010038, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_length_ft_llama", "target_model": "gpt35", "recognition_score": 0.9763105297344868, "ground_truth": 0}]