[{"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21076629049298767, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1393963764704882, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10374862859993335, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541661239269062, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1370697790215486, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2814056155398292, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07477004861082319, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2942149656102029, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381427384451, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819764848363, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24944721725996138, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2720245578680495, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07423136616786383, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04940524709823738, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.294214982728498, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1812632170063898, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4416730208992776, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1931473725925378, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07423137015959537, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944724117735537, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.33807713877446327, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.472683482046844, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6001883541905481, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12002562626770565, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408782346489, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.665410559274756, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4785288309726251, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6057990549749184, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9252299532134551, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.396068164022758, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2509127834800174, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7527403331462595, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4139508816190773, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.38121956613159913, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939264399667167, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3174262819888676, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27512972176190065, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08449275323933547, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798743986865515, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.097390402538527, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3007455805050499, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16559311895847678, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1540575572000426, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29098085077595714, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20055767068054497, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13477592328367324, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1325145706650385, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18126320110380742, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.172171850389654, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18359363064770087, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9810945542236941, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9564718573879618, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9477691452176598, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9656413101879752, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9567959672813522, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17553805791300364, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08945460456712331, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0863234761278885, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08570927774474947, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757213812195096, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04434857661746773, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20946968630415647, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3023910959883205, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02153287888625988, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13753248172800966, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.011029470042425833, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.036908068072140914, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.018055335924582784, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01697999206703457, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018404891366029817, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04518375478761571, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14608724966221986, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03803509536636716, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.034618839999185594, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07807816251884558, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5486734760112584, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20181321524870746, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.29583986555753916, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263216039572421, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990572523297, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36477757457327054, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013584391772606421, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04418332048616846, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583987428273295, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08694166299752973, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09670579066067302, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4455295384528727, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02048855378723241, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02635535385383955, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04336579923617945, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23934933079226867, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2407745999451902, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5370413717904653, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590153955354294, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22815649954386777, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.051845465448960765, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06536578512089336, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.036493767733403015, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022715756230341323, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012970387867071163, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6224593229760568, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.609524175020187, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5755880030824122, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786247000312, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504744456344, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08570928115445044, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04724971670097749, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.061424037825658556, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022116588879039906, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02635535310998111, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3593641393067793, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20181323090006567, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17106118801658937, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921740476102755, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808551634851, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.049039623516446564, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1139734560277384, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0623310362400353, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06278920824223534, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015014747778258017, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1456006361490078, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17724053102110884, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16830943497447848, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08977329021838933, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10302442787817624, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1316190416675501, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1645164514543499, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14511536308255982, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10669059310418619, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11676401426312527, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028007521833163032, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.005159622977276081, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.004264634879615234, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.007968814783124707, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.00851130321349106, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.057071398874019574, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12252320794924017, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04468087323332785, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.008315779357163553, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06608537865713764, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7994423187283157, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3923368424066519, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17106118214916535, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952986798796, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897455833164, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08882029321313677, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2583259826194129, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2568319970299771, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08449275809461156, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08632347749485039, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2766905448607338, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5467381874216043, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3923368335009373, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800994878622, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646230228532, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25832598235510135, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10894503590221191, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18952109842324813, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04304284965211429, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2735743910024402, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7356416469850634, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8955226818801962, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.43398144296846936, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352769282215, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331419445387, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8661325130491163, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9178933667911334, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.958847114258604, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476555982392, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125630148533, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03567855496921906, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16132023576684507, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09073548484957498, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337717373568657, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406649320874, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12002563829405881, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13296424148614958, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05623634326135687, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05127242001483291, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08509904538116787, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11279540174758715, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1925393520275896, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18772760190558424, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34334174758182306, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12721827776178346, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.47268349079762134, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.317426284946119, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25238405410375153, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337716962060194, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681562971359, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04995852360598042, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.033211168663843646, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5234203489669268, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819767927606, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1276526189798465, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.152032248687618, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33807713406001555, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10970577831055214, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124121744397177, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08329193172573744, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14033625720975332, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2966542763760849, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1738485139219837, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23231015227377008, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09704755847965457, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14511535705919776, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9505947503563437, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1175721339041357, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33285233322258684, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1510277969769124, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09073548775424924, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.046033899301650284, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.039937317104827376, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0255652129109395, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.056236346079894056, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4186969229633923, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2494472191238295, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20561503637763995, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2200070990543833, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.37022538757161894, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25091279420313345, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19072401847988615, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5195213204874449, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7162185975536056, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127833309935, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3140505593903148, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.40733340686231867, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.39420093267672907, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29421495830801603, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8944211613614256, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04958902617736707, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0736962704816563, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09602549067811333, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10970577376535368, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846179005181147, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3311197475487795, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.48047869654046527, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5736784037408447, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436004225722406, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658974333947675, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.35936413159930747, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17781086731986429, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5292633897566972, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804786624819027, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.46101678897654147, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.45519861332854444, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6057990457213692, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6495786262994016, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990545565127, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358088636384, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5832033334328409, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7853085786419849, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2487166323602795, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.687629990791904, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6085940376633058, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24077460546178012, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14804718689423615, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21733751900264514, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634330152411, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366072650108, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10017221916865185, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2704802358890933, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10017223047229773, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08694165778963003, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1329642469456292, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.074500254710415, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1613202464743279, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4016878108448613, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667160370621263, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953521370190688, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12002563805972229, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.030444350078242026, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1710611813098097, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2186693698854366, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15102780187391446, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8770561986631381, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8740772259202797, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.887984041109052, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.90829303659494, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358149582768, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.43302218079014937, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7853085786419849, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5058591040114191, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030758522135, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269806298391, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14128142119896814, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33982761708361, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21866938135685893, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048022055686183, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39981164962870036, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6992544108871523, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5926666080800699, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.929440402668064, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.39047583640070027, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20817895036263798, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05460060628674975, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06903792992015996, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12002563861380884, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10302442831279507, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544873370766504, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5794004047951931, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.40544871624789885, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3539862983354235, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7178037997412737, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684560544603765, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6334102542628495, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32939171773136267, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4436004394858539, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734872231134, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8025555409848468, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8757869887386496, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6909762947108689, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7634837884820207, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8683809541133536, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9324533088565105, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8629302186157616, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9658995734137567, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9164093322574403, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9376689670308106, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048022116662623, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.019197449773788375, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013532149068103648, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027480694028178366, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.027376489628585483, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.010818448020960502, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19436781120974872, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3380771296963397, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4263215719933953, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.087563847785301, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167791175811, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7476159493037369, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8433798272853664, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9167080754672885, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7766229473881181, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9348724534644801, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3023910772612059, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.41111085733855324, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.35936413174515935, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.26284184806812705, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132652142487734, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08601588450529504, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.235108396558913, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07504072666892429, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06804042489272752, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06979492383114098, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1871326830112543, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15456732471549436, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18832398047019647, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.052424561434376196, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2186693785681319, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14318770961759308, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18713268057222418, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2351083844957359, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08945460305236513, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14366761028750297, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18832399313759599, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2751297152620171, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11757213843438825, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704519222672, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16667539394509667, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4397473470461678, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7819972855140879, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9869292152002832, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277769382182, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9741412221085756, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1412814206320431, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.036220058140451906, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13477591873729877, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0786423860267702, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04831607210387598, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04655127343706377, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.030329258993029806, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06371499790013728, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05791808400459666, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.030675800158895736, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9600626817890876, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9756698094872257, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9563089409170852, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9346342163481729, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9341552986399155, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16885695036151907, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12252321170515551, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13477591719117446, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510837991923117, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11047114671538046, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14903529368334348, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09947020854374512, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03963884164041434, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03197956097039117, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012194134030227422, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14804718059988903, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0940101902741903, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20307464386995527, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12002562977636552, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07613248329098628, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3830641775447951, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5370413994200224, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.29910519344322517, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133092037033534, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8868130927954507, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8294920012787202, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8381505561354707, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6325027488653484, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563452443943, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407826026223914, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15921739862478468, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1699562337452392, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3647775710326888, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048023137817295, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711608809695, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09947020501066813, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06730107908194562, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04778006856857453, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11961367268437799, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07290026615329995, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.26133092619849696, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.37845909829345414, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2081789393061634, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24944723203525052, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420094112074316, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07185126970641216, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09877258932097308, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09636510575928157, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06681232823402881, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09009299792990227, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.38676342752844983, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4225046224485281, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.37387582507052775, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689546383221, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228613178213, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.31742628988781757, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7613610901920157, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8795611880045872, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2186693779921628, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167301890788147, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.29340448289938387, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27982850073205134, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.28378138998120206, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181321846603006, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17553806356906168, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4101654996843854, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.26740817765977815, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4263215708609846, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14318770659220434, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5554352491521797, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2798284978564536, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2720245676233188, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09334687504933331, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06325052242634503, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689414392414335, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04451442892586344, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08850466774702279, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02887090703298613, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.060086643440709527, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03488088885697733, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014842418127103378, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012479699821302617, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.014957086398658509, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.016215031034827423, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012920473253377243, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10856641316578879, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3259495271015606, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1732882037119675, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05834583879419109, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17217185946634114, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09534946324679015, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06730108164984704, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1366084090221621, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2845759969874162, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18126320861915007, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13206614571651898, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1135795911065287, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10970577217039552, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213217370907, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09467770879027552, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.293404489114891, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4474603053802145, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2925953277036458, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798743826196207, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.42632158638546375, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5234203611302933, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5945512753329383, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.544801386351283, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473417346658, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720487835468814, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06418264090733071, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17953055883810135, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07921032313587154, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242354163478713, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10017222289730705, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6388352781257708, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8449215439413101, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7819972876673815, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9136765233757491, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357557022613, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04177388119779759, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32594952474360983, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14318770492844882, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1655931086643133, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15002881957412892, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11436851869092575, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05921025188782028, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2735743959091144, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838509940797007, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1431876998296092, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08122775650294738, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2173375157100633, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08181271257938025, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08882029028847685, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.055412791434825866, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07423136558883868, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09467770571817391, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08479540255768281, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33807713391223687, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0742313673498334, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5544704554765876, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9210741191731573, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8413048072828321, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647172574458, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216151094613, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7669924737182738, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8311430403606604, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4941408994357375, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8316905593060591, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033443036246, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02920129245315196, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.027690256740425277, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02635535369782168, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08299414744380344, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.017375664774952452, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.35220177632511634, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15203225663972, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.36840572086168194, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237110524024, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204880194610457, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01778038887772215, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06325052344781368, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0227157554569239, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0414622727332812, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05261895757768256, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11162800098435742, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14953138705680016, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17106117267211496, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.056444024871883526, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237059489783, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0378924258499481, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22815649116502879, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.35042138540858214, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010666694728722, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509128021011543, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.468790621884464, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6279512143329697, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.312370007503796, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804202770224, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365654488122, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14903530760658945, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.388618010580664, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3040416834471886, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10594827838654626, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946968306089223, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09203286083544415, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2030746381232071, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3904758397365244, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.187727601210226, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.180106666194895, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07531230648526245, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.049039621212871747, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.016029146853339223, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04401865510199249, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08479540328542523, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20434190087717666, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09807932360597188, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.49218811298081944, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1835936295392964, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742627918795735, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13117322116178343, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5350984074684584, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3539863153167644, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2735743902027931, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451447640044, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6926419893797074, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6370308216964651, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15507848497018373, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784270239605, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165308542505, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9608048688810782, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8428631396293687, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9783846686581857, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673098699076, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743777229438, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4571367322081923, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15507847260272903, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.39233681948641325, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633104940161124, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525396939170398, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11279539440578203, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2436424479268424, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1919327869638606, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15304215639821436, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.282988120240806, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14223188358620215, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1925393520275896, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08601587935922644, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34334174758182306, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2950267717307923, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07585818393250146, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5273165142199251, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13028542140216617, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06008664788881063, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16995624340692467, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17895589031251982, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1634454295336147, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12336562229047224, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1097057701944599, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05921025557604084, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05582313882831209, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.181263215004222, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04940524651674238, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04707418110664149, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.032961244253515376, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7248702638236026, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7201714948841595, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7577943615489968, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907613697235733, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7556369881738553, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7772998523292991, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9260366259645304, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9102267066939124, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9626731138112742, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8868130877091327, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.048857782860077734, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.079782016163696, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.038178275935588216, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12940273270393168, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16559312374680354, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.32423538815914876, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07159119904356484, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23581158732322058, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23440665011279774, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2186693780190961, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20689405142662684, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09534946819934594, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21469142177542588, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12421300858157679, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08006926526925631, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05644402582253765, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06164962287346268, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0648901159073436, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12168574766541974, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05051766932047103, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3684057206605667, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3775406653613253, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5428632685221526, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504781967696, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7872777436965348, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9241418264623622, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17781087963410813, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7924642591152005, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653335490485817, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397192841413, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5774953769624794, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4697635093612476, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.527316544627993, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6361270720507904, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423186311825, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9167080721308893, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6104534705119751, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6636689369975692, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7468782064216717, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431986359517, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8494723714524121, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3407044869763438, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1456006371463823, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667540104725026, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117165976744745, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8056321832784222, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7008948017575378, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.39047582329537106, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990399236439, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.433981474848482, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3380771510315616, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17667160766615325, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08819004219668208, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09041372408811602, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12765262391451826, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9304582589491305, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9756698094872257, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9626731137673175, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9346342163481729, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9341552986399155, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05340332988473899, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17667160423126949, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09670579382040403, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.037186775952993606, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561504544789866, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4186969279436189, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7468781757731401, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6113819959071016, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026603537152523, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796550336628, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06828854082055222, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12678517164421496, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14903529691260772, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12294379610830954, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14080818236428766, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4610167796413226, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.813460780257908, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8193157790680842, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339717687726, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8852352193732025, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031738590686111394, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03861093068287802, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2643583672575279, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18476750721698296, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01652955682717832, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3040416838261689, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14953138624970358, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11757214020653757, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06301946776862612, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15102780704940794, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12002562145569881, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19072402023902113, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1666754012310038, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559408066617745, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689404382521126, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25683199927303074, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5832033554281353, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5602526709442692, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116452322143, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3398276359344112, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03283695633444553, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.023509450866105407, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12506538397684963, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05964694162577354, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.008985428818187438, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02931223054251531, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.016529557421097137, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18713268343270326, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.029535337072500008, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.008315779172970085, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5389832063509475, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3115315670911578, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.544801378282073, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418469223193, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796465275539, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.611381976494196, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.40733340174778515, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.37296187077143095, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.613236573049944, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640454079862, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.029090755977324235, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.015663649243094775, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.012821214973755608, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.004086002534194816, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.009596454462292795, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23091974239589735, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21866936755133404, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3090237099403307, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610490835897256, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4263215701169305, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17161580387277892, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.030444350078242026, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16885695672671014, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2186693698854366, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09807931927225823, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15817434903040137, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14414885017880041, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10743747295998275, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0973904039335765, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1540575590589243, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.782662485107089, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9481545333057266, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9403530602646215, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9471859749183492, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9585377264640256, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.029090757086395597, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07004896313093785, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03817827654100154, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09203286809346553, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09739039455306134, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10894503544732306, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2295352093543275, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16559312153555145, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405546226053866, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18359363028885958, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0568615523146258, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07807816115618615, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20055767259214077, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.028007520966782128, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13939637721601816, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17328820643219417, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1655931256501657, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20055768910098754, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128142023495727, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320633830061425, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.800067883518885, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4301473425268176, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19559408167968403, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8316905595471709, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.66627966963095, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07055959720226161, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06903792992015996, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06903792908221107, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213764457657, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13939637854317066, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10447731820120051, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14804718235597394, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04795810290194325, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561504395272892, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1044773248721918, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.026155619653477114, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.025760559722282885, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06804042098155118, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.014957086521321387, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15405755818754083, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4765796558809842, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20689405118096477, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.577495388302326, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.42155181787074236, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21601152930781872, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03890198102982743, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04535258045074675, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.020332352083698203, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02017731975980667, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.017509556092132325, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08694165825989887, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.34864514397642243, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2909808621423386, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076629645206926, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262609340888, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05460060672021526, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1451153582459944, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6671476699968568, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02737648977304179, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238002530214968, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0697949201265411, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11436852916398367, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14223189384995294, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1338674878151086, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10087861435421576, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5774953741788442, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.46101679115084676, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18594720988834407, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011671561974, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18010665890493224, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4436004088767047, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5926666046831277, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4493926587332026, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526632188812, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704613571545, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07978201383719753, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3451052788665038, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22541661170829855, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2689414476227343, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.26435837180171484, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6406358506573342, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8233283926056877, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7461389895017854, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.36477758633626195, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531277882827, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07477004668532254, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09602549649085841, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13477591953680823, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.345105287018537, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.048857781105815574, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09009299713302445, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11838509789812188, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10447732455698064, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776334560216774, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2005576747124165, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11676401035094873, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.24508500346157083, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16559312447730767, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10302442915729236, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39047583809941616, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.28298811696452747, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01652955769057665, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08570927596220941, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0338440320440635, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748668911014, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19436782342642842, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07263670727107924, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3191213886464942, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13296424532101386, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13753246901224, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4436004235330731, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7217431987675554, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6187804445460536, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2200071103661012, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.25238404689062965, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03817827458218573, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09138210664709799, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13206615499116547, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1795305604990822, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09807932571708079, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7859664254201986, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.680878619745569, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4474603043775995, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07343005012493098, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.859191820783229, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20307462887912806, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09334687497016844, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09807932613109874, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07237401965217943, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19930800162406745, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2538610118786586, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.294214981661845, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.184767513041165, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610242855353, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10970577252301887, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11838510334266185, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19806418066771317, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10447731621661215, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1592173981117915, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05261895469860216, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02615561886582877, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01678549098039796, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.013222821931558514, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0894545975645631, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0570714011925198, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2133771677502114, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14223188739032716, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13568954677711184, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08725224759285946, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2643583565166038, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2643583712735989, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1343210561855211, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17497346176212555, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05089371959983685, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07316471414849791, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13117322808189075, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18359362671102228, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20817892412854458, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29910518599546465, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2094696809571435, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.28140559959856026, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4111108694596776, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06560483386077517, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29910519459333595, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30985844573131793, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17441027155427977, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06325052527848332, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13028542675482696, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09670578834849275, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24653334515656822, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23091975421551608, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15817434733885807, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1688569571101535, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13477591782517565, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561505477335212, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18476751206229067, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09670579278722728, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11838509924162441, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08329193206280651, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10521052993020402, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04401865283946349, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.38954652831920666, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7962924515778651, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366024971044, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191414323515, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03567855414928347, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.019568675754002056, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03789242553745183, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030444349696529087, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024237633720512908, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5370413774519474, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.26133093272335023, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17328821395260702, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815650748578659, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948076116855, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.28616925470332977, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2337063446631049, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06119923021577796, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2351083918089908, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14903530594526965, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15002882327291286, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09073548597051086, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22135069836902727, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16184942243300443, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733751597544498, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.017309096372770272, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.030329261282681097, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01791734390633348, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03358950775446021, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.014447851956923951, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.30239108145960153, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22541660554529422, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.33111974891510754, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798744020777613, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606816095348213, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25091278698032843, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08509904399156783, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.041930526191944435, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09773431548220698, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08945460544966534, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15507847543343098, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6859494440246063, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16344543338373285, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798285127531831, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05070536405635707, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06903793205595535, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08819004423951878, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15002882715220606, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08819004855130735, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.019946934640435354, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13296423859611295, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.035813193594530654, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07004896314885461, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10158945233033678, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04336580130485797, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15002881760986767, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10818895181074731, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22067816424708514, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19744445613295666, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.050330630600057345, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.39793841598925184, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7739006235063436, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.674050478932117, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389831943698573, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6967842461198641, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.008511303085121696, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.047425872873144474, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01196109888810549, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07696083743302917, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.056236345417450505, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3629691937691142, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1550784824168464, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09203286560445209, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10158944942526968, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.27669053970850005, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07107366577355538, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2240554604972277, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14128141027786384, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1677633501695471, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357958903212036, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.038321973582878754, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04795810407914795, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06210312513460422, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15304215254864598, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19253935259557145, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.45519859844289073, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.632502726897537, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6132365425844719, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881543251016, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8582440010150701, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.30569733270562144, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.35220178949097286, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14128141418983076, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1412814129559743, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220563206252438, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21933749531143473, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6901415566688769, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3504213721211932, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2160115329461621, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.38306417983472824, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09235979673515987, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5428632607116648, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1167640043920925, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033624644452142, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748859283002, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05379964684102494, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07185127204165583, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03296124546380386, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04352814240072065, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10411240372935246, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4092207927016353, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32594952673685124, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13753247165662313, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381502423199, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6270381376922919, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6442251201469699, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3923368467642331, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12808824410645422, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.26435836364274706, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11008787787015874, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08329192895795265, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14033625321487653, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5544704661247764, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561504838140043, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07423136405538859, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.668880251777786, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.490235614448652, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6442251187420177, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701019772499, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206722736387, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16667539996034275, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12168575225711657, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.28616926356190736, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24220564397461067, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2018132147630002, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5869964230501317, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5136684688848363, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.45713672847358366, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.071591202472373, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1490353071672037, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27825680380032425, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18594721161538982, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1634454348912101, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651623374441066, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206338790911925, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.133415217574458, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19436782791655074, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21206881788669527, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16291204426179906, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13986564289968437, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.140336253517299, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02153287749951707, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06560483433973807, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776334552251657, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09807932614116362, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09739040263062099, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.056652425311820624, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3007455886428638, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06754669526737392, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608724482530758, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4843800881714594, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4111108478013976, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5019531002651172, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668456035608052, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764987109332, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3702253657971157, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04689925922188852, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12043881464086145, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2056150423514211, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.136148309764961, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3293917241889954, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14903530440504975, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10158944252357892, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.049589024123166146, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357958954278155, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4960938271793846, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7461389718273056, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4532618514511031, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.867485427694682, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.922202543866104, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.823328389616009, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8697145866537556, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8723473765990843, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7806625056894585, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8966140366855975, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04940524393689877, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012241275119890569, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14128142007102776, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021948254065301893, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10669059866155318, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.32082130254584196, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2509127800474445, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.45713672819671386, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06804042560375345, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.357567540342204, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21206880206770634, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3812195771734646, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5175708922949301, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2643583710864046, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370634661212014, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2056150550114634, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.195594092618616, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2814056035146722, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09334687729318593, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11596071433732204, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22000708684946377, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028007520962072343, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06394842093606617, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1147647857618803, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05242456197882248, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.019124036946366798, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06828854302175598, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08509904351090526, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05500528426910462, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091975381829255, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03527754647940153, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.36658973917032306, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20307462629466647, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15304215650550315, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135069161283896, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6706082928231925, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.47073663897490353, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7766229379612558, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300580875901, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185830603395, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15713684645605847, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08945460456712331, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025565213648482858, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05582313897182573, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678363932185122, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.42441199869124946, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4863315078492445, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5736784094962355, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4378234877417024, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.64601370499869, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4225046222991987, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17217185430964277, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09203286213058823, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3140505596486705, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12252321717583695, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6169358145197451, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7025300666334487, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6992544115371734, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445394227933, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765073120162, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.299105188921857, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15507847704790031, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.527316527461629, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.339827615272588, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544873251799823, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2560871237263085, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2814055838605607, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5175708755935988, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964317762424, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733338672336916, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.00891612627771583, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013532149068103648, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025371310798474808, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.006850479861287835, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.007846239259910768, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0844927544777269, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12168575707310876, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10743746989794441, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06560483334184444, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0721121985257791, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5506073604072796, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.31573598402720693, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21601153460916026, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891543329589, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3040416826412, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1143685323403225, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15610490782786726, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21337717074338555, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08151975308197461, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05320620342411651, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7279754388268534, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25982565371062033, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.48047866875602413, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4785288517634892, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035704479536, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5273165391842809, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5907792153150727, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5869964206231129, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.741674020115449, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4205995856785242, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.012920473000204007, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06052939231164768, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07159120099444617, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.010288300573499784, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03608394099948562, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12678517036958378, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04434857945283033, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.019568675396001847, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009783875489726278, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03541072768865364, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14366760424459243, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16344543393871816, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07133199848877698, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07004896191194958, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0894546014927466, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.42823339292273865, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12336561911499093, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.38861801333788454, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09073548258557819, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074558528719536, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.016979992432520602, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0366313681066201, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02169809984063409, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021044567533234828, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.028114057198897955, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23231014497330124, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10631887680716255, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12168574783871089, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225260100474815, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15002882378442692, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.30239108062270914, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21206880165637174, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16026602707020451, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14706452261325859, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13206615935988752, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13296424044603727, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.42441200373478205, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14608724704257808, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20307462139036198, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1267851642306516, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03760863711624811, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.029090756383669734, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06187598846294472, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.032344330276122976, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06608537393485965, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6992544015304607, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5282900908661398, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10302442727945803, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688247738215, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064488166975, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08509904488267901, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08389038177174926, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1500288277719448, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12085323145633112, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561503430357203, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03832197445949579, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02120611893821176, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05899303256709128, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.033462934033133065, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04054074057484454, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16344543649759075, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4668456116817401, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.46101677630576926, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1403362431200608, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300357995755244, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.443600422436313, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17781087963410813, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7138307412825937, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487352763193, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526797532255, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.41679664664933, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12168575883080453, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.32082130517792545, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27825679735776565, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.857768106197292, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1907240200586997, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1023046989124491, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15304216345411348, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14608725075888365, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1225232063499122, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11047114764276324, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10017222596961774, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1155608773611752, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1436676168338244, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14414885663416704, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08479540273729716, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08850466544537275, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11008787744874897, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07159120480695158, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241992845512, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23370635095125086, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17441028394184308, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1525365138148403, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10338596325595202, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.33807713907305076, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9750122043485752, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9291838001310272, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6279511925825018, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.339827637096794, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6123096530161343, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5832033525573523, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5195213264621488, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5331543803619131, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570648244156446, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.42250461463898753, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12085323348151578, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16995624189443925, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06371499393131144, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596071569437714, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18713268564276603, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04795810580738092, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15610490650944248, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10374862799477623, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07159120286793598, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04518375742744571, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11279539714565351, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10669059361567476, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025371311613735313, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0041987952669091805, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05419872858112105, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3363310469239726, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09877258932839834, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22405546475112736, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002882056203826, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469140377356366, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06560483350111085, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.021450730976255057, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.034618839759076384, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022715757190176995, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07531230318366423, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8080672094376594, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9705764214850635, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8610715695219924, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8719117649047315, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099607033333, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04304285229343671, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15921740597423048, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1561049059641258, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021125195012148774, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11201595581472254, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.538012449165105, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2613309202256431, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3007455934855358, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18417984792402695, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.46879061631870694, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027795624638930386, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18126320535154852, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01905089833824734, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09947021527846935, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10447731939408389, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.43974733592546544, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10374863195945803, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2829881294261167, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792990306859438, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06853749408921546, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.35042136951064284, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12852513510978364, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14223188477998955, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22953521057771423, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421496136080316, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4186969233702181, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.31573596641597396, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11357958503672762, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10932482069609174, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632836201917, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9039745042159325, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4130035852481101, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7520125574409918, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9307105867379816, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.931462507498012, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5660185647329976, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6334102552209507, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6039318251433968, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063694972419, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494462452465, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.503906171899096, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11516223357655404, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5039061592961231, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509127961161813, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684630550369, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14608724025164135, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09670578595763116, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.049222117271609196, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21866938690163967, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13206615063392466, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06371499298481305, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1853566171132991, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09401018958834606, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.059646940270886406, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23934934131234423, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23934933393561286, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1778108708748016, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09138210857096223, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09073548208312193, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39047583406390546, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08269733860860821, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03676946555032651, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.032222296751287426, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04569203323191431, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.022457054646518527, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4378234969832471, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6001883287889874, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4668456188224058, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601151825652304, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4513265145293056, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1710611870170993, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0769608395624138, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0750407288190445, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07892587990867259, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559407946239113, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07864238306617002, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06278920896715619, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06853749297987231, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05749327718122456, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608725102816086, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18010665432709722, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5717666014658105, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2689414406974847, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527642901305, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1422318889665133, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12002563260248951, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11757213376415217, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08540366654656512, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.025178843701463723, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04304284763854761, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09807932163021985, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1441488471398945, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13939639010521016, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05480259104907164, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027066175721588183, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.48925945561064527, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8407826089955194, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3328523306820243, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525397119528148, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288363341332, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05791808685868752, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22953520477378772, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1907240212847463, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1655931243330176, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06052938916169035, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5813030698331362, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5602526796176556, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.35220177238499334, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.474631185888555, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18832398328643465, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7008948100591055, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.47657964173459993, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.39233685681578584, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880158981805, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916153052603, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05223085200796686, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4311051126155292, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2674081700134429, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358112382028, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544133609789, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.43206337377678944, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.29583986775843957, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19193279423622223, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052853934973, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4320633977059919, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03919513073370776, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08269734152933828, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02017731964234225, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03775027645092096, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2735743891617365, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20434190465168775, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7356416378284746, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3311197370051713, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09301680128327758, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.27512973042801814, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03308597795239961, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.020725061815691524, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025371311588185865, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0294235789642723, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03875619723484454, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06903792895582493, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.24798743728804634, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06954174263049502, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.023330767996314086, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08035746502199045, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5851011794028848, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7325918518000691, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7201715154299956, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582691749682, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8392075635116193, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.024423090435704, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0356785532013443, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1883239800638659, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.024237634740594965, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660840127272464, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0665691894928611, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10017222773905604, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05623634370449464, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08329192881773848, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22815650675933435, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.025083141815870565, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07237402356368845, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02341994321806947, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09670578968720876, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.017442484879501296, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13477591801286962, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2877678009932578, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16667541018583837, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3040416823749954, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1919327873588635, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2861692639567482, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7969253781331765, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8679338531263407, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199128534413, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641870455118, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9701269075801454, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9815951103694214, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9860979412180139, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9854404806957752, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9872772902615646, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.287767809951624, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4205996139859718, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.40356685716297974, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3140505547229968, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936413139819684, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.422504631600552, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4765796647076962, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5409238553462062, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487319268414, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.37570647777622135, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01590639164853533, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.021450730783366012, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05623634908548336, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02245705525740022, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03846619121986904, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9319595790367842, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5907792004548729, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6388352841590885, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.949669366091756, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953619719421, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3259495232245309, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.42059959968719407, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4824291227949293, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3311197309738319, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559408406599652, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13432104844616707, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5698526556522283, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10087861849132869, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405755207840818, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10743747336837928, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2782567942966633, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.403566888748965, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17328820363076788, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203224620296804, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072403013613973, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22953520132204527, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3557748751658883, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.056236345708250195, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11201595647974077, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846179008210688, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5253688083126886, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6132365632247715, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6370308020774739, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291041189672, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180236028445, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11757214196177627, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09842541152768858, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13846179238580264, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1540575591103087, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13753247162286228, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1081889553309991, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5698526556522283, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11279540272081487, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11201595344368108, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756753593722634, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06418264212006147, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.051653785422758745, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04008735957022031, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08570927662888359, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04115288725419077, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21933750171771052, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2814055838605607, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.32082130710266527, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.35398630991993185, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711698628078, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.46295858944124957, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21337717216083746, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23091975537721005, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653335100530543, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651623892269794, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1535491800642633, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07921032612782895, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17838265926411348, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573596976534085, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08913693770505358, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5945512654841915, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.466845601344564, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30404168574545015, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204879722292034, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.747615953846493, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6495786331861423, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20689405802029853, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30404167795504294, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08449275825156768, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1755380745293612, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1225232173535128, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07779745084951699, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19314737911495, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12378868598216289, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22746933575577472, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25091276218290637, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5698526434667617, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.484380076059636, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570648306478954, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4649015435517403, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12635333621682396, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1871326778303035, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2094696976756511, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33458944530878404, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2583259618423192, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.030792165826270767, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10970577254383823, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23510838502350734, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06804042123129629, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06681232729136359, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25832597292855364, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15610490312196273, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4551986011239207, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2173375138518908, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307462877155957, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3942009445615951, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3007455777748911, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4054487232887811, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21206881255369642, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132649965721433, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16132023724077965, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08632347827194804, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20817893110117927, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921739717661812, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370634197427845, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.022802637485314886, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.28616926195762066, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19072402473274164, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13939637736957827, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13568954213142523, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08181271404983972, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.034618841148707225, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04240382961241405, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13117323105171144, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11920292229613155, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12506537809159993, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11008788647073442, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17781087324344394, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13386748566506776, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10302442498511272, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.017848737217925188, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07316471983786209, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.275129715210464, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14903530181377359, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0609751818377271, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3106943869481575, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8962513703999235, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7461389872020758, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906253266124, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583095668418, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0700489645191019, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13753247624322704, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08210662965303721, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08210663265344033, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692440356671, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2999247451622083, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7217431971353394, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9036348942576541, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197803970457, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473282861568, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7725306597543351, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.71223217923322, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7918210664962037, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610167957178819, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711636803538, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8449215316286182, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6654105605225761, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.47073661189642413, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436004169685486, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526689954861, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5813030618294592, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21733752347622654, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15869518751376166, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405546664948786, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.338077126456155, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.35220177460143876, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5253688239600902, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2628418607222893, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3830641923310861, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.46490157924604963, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15304215484124173, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08850466403783987, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1155608815356003, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.046033898199077265, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.013636835201034694, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.043042848186802214, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.036220058140451906, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08035746764834345, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0913821085682834, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06536577866634585, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13251457424770213, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1001722275020541, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21076629989287535, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07369627731892847, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12549344937214002, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17781086994334291, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20946969465026818, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2553436527919838, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20055767675965114, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12085324111580914, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.015543647283418819, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0397878069148938, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026963499993311504, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0492221171854069, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03817827684271472, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8198933384994294, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7233094667481151, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9458012705282957, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476676516687, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581538248617, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1835936233348414, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.554470459682868, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5117165863208211, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.527316528558599, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237131811822, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15405755865489318, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10631887680716255, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.357567530545921, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205996079187355, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18952109615985238, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2806163876237115, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.26894143767636614, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17441027778894644, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11201595876984512, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39981165655556233, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.013636836110812792, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10669060130300488, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026255301268623518, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.017986210560175162, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0064131634785359005, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27357439106582293, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3174262858257719, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11279539456685468, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20817893489586906, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.37387582656326546, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.694302647173554, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27202457763015186, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3242354013741716, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838509876600599, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076629702070546, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9284087979037275, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9580694729413592, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8914335810439735, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104550545622, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9383503783309476, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20434190547525324, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10123347464814364, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17106118296363593, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.28140559756277767, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616925956452405, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.30902371313520227, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.533154392554307, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8947894592404134, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988356873525, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5669778400419009, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08035746364726301, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10894504415976886, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10158944684689272, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14854055286682744, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03649376820998509, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01685007879154768, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08945460359288862, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027272668868657337, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.024330187945882497, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02987309193239001, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014227046138855556, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.018905446836314847, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04008735744992127, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.018546565463619387, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08389038746979331, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.019946935319927923, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07159119851230004, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05770531720589133, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0832919276792094, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.025565213705545695, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4111108574916625, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1666754013682873, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20307463096258604, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.261330925848858, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.430147344781261, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03832197472456739, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21866936801449402, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1699562416369194, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29828690750073067, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06779314002412648, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010652512046501559, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.013584390902466801, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03622005759535097, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009559399870364232, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01518904937088396, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19436782762982052, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06441766211171686, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09367799978821988, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.038756194045879995, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11838509503339067, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.33458945723423605, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7446563457266479, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8025555512695157, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678230022851, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354685816252, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08694165674376635, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15203224530011855, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1613202343175671, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223188907452539, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616925788248626, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09704754894045672, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1913276911151605, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09301680566454215, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1623800298827411, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05791808832977962, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.26435835829701315, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5583269970018995, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7772998529062211, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.760650668105062, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389831980752234, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05877655674631992, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.38861801914160626, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08756384388355787, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12808823761242827, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.025565210925488073, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7872777414352494, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6876300052105175, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5602526533149965, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358289940773, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222943203466, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36658974015885415, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7563575438405248, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27982850196234804, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.697608918780349, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16830944691114705, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.270480228047745, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10818896073947472, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11596071569636397, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033624820217805, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07558478117687804, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06853748946350163, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026861201544405088, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02727266717698, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.018124719734619082, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11920291849169637, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.26359939125105825, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4455295273438726, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4649015790380446, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122013288142, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.26664363410686054, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12852513847394625, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0630194703845022, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16132024438337877, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08181270910376666, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12808824760457865, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03732688850450675, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026657740553120955, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04501553305614972, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.019050899203659412, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01461566998793153, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0354107274688775, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0946776985586334, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0341004268580961, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1135795811534551, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035906194594, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4186969226029442, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6486889362277423, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7287482948694735, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023561230738905, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606817096345004, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.021698099761584787, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.021532877390774453, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04320403239903499, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.012100386390910272, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.016593178115916284, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.48438007898766194, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3793783963326239, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6406358651127912, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074558040260674, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.677473999860348, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25386101903370567, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2689414417886525, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3191213890661727, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010666089524113, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.386763422298826, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1744102689365414, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14706451992047367, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.29259529608016493, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12252321207530496, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135069543341881, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0894545981590336, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08329192850859549, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06465349043542924, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07369627087056702, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17895589360234487, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08570928047782367, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1597410245652272, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11357957826077485, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2546016346961678, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757213546092235, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.637030796180351, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3293916981350368, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.26740816225065783, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.42441200278130425, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12678517688148752, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5794003893020752, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7431679837657122, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.85488463727756, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951067324436, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544439771842, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9416541611199644, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9329437153342605, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8311430347258527, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9443823889814069, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545609599174, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19682621800603228, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7613610901920157, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.38861801400118245, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7130321316777649, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.40168780053752995, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.015483988695640728, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.005774930070749782, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.007815889166620673, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09301680935966476, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.006026951530864936, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4092207813296234, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6039318430819179, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3504213682664395, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384387280457, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523206548507, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2674081555983974, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08882028898442161, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.032961243119732586, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279540592622479, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03690806685983835, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1470645232081679, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.060086649398876854, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21206880618309845, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08756384519525262, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09947021611623277, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03846619298370347, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05014425544248823, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.031858856538534534, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06187598853317955, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05770531426752715, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2240554568559307, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19436782731246013, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17667160889537137, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601152424338332, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364245914553062, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.023509452169017873, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.014337030959605557, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.009746103691055443, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020804490271848428, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0651275473733897, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2351083855360555, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09877259001099555, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24077460366785244, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08882029184602928, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23161424446371584, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.38121957221484, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05460060644199868, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22953521752981448, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.25386100971725817, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12506538051062613, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02080448958083282, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.007011795606500873, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0163401281803119, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.007460643216682591, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0339719988319458, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18713268075770653, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16451645930465517, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.028436032137974732, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13939638673539365, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561505006031533, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5467381470394153, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7669924724686726, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6495786112340918, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8852352240536102, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291057346916, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.49218813465242556, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.23231015381742232, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12549344965550668, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08181270910523564, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.188323985585335, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13846179594751407, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6076631530786734, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.38491212855995843, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11797801135329399, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2598256522169657, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3575675376023244, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.055823142036876876, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10052486388193357, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06210312264053622, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.039638840331426325, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8577681148459905, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.743168000818503, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8098781695537329, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7599387704810668, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105676912053, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3328523272454778, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05184546806142136, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05791808860165403, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.045015534701037606, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573598325999247, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08093670665607167, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08035746701042056, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06233103760550683, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03846619505353644, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12043881420389871, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6740504547658176, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9190632855001977, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8128673106152217, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.712232172169222, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7570766872788965, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2982869037531717, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2605775780968892, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5860491176180063, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.35577488034742016, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783992365812, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.010570488827446775, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08756383660980584, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0627892057446844, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05770531147828372, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01120121437389046, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20181321766083393, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06853749743371064, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1490353113575977, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.28140560068827625, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05582314192146915, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3380771316944342, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11008788647073442, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1485405557114791, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1263533378816431, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1490352951162516, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04099902834345415, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028114056759718654, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10230470467735107, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34422296665450636, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.154057571277643, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.037608634122193445, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16995623441819527, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.062331039048771304, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902356071707402, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24077460276050094, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.029986506102413536, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1233656131086522, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04023794458694684, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06278920706999801, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05964694148130452, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3380771475001853, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6206215969258679, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2974699448250727, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263215903953759, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167932349819, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.009974921337652331, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01627746186644526, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.013902058765386917, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04161779516664762, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.010052368927695489, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5292633867247986, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.49414088999145084, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.537041389224615, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.32082131826223603, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39793842328237444, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.42250462559305185, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.57558800340089, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5945512573143961, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318344651562, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073687399334, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09203285928704935, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.044847906349587525, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14755517945269508, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13986564163303303, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12765262397649974, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03817827480123201, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01287074944248834, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01115803052988263, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0225429660767754, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.029873091808645304, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.44746030233925327, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33807713078740287, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.521471165224141, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318239915079, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238496366731, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02716923250085705, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15152935123666467, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04922211415436599, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07585817742675051, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04146227242462516, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1384617937191307, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.28298812230865716, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2107662880338577, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2766905126652254, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08329192755695074, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.46101679766477216, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8019358207039663, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6817267747141805, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365612167885, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590761461510044, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08694165396906374, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.47463118494924567, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1520322496321914, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660839083472578, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04518375341980065, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.125922763501045, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09602549442346439, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19436782522630563, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08882029560301018, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455803579298, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2436424537721821, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5506073704069459, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4493926477233821, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2133771802962961, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1968261996976293, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9871787853080621, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9623913637523488, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7704647936441241, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9936116792822879, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9628132243987023, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5253688009780509, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7209580372472328, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7759445365938347, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175709247987309, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408978308046, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06052938923066534, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09138210347958785, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04707417842664413, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04084571693867325, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04885778165798384, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6261241898362694, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3867634537823966, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4339814942152474, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.39420093263001255, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6085940630379829, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15102779642398084, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0926877828483294, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23231015574359934, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594720745427665, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2798285187222346, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17441027947220558, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.44939265121018607, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24508500561803653, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2845760074260129, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09301680453557287, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04603390140846495, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.26740816907183146, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06371499374650598, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798285012086633, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09203285785324088, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7325918293278426, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8289388168509765, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4532618437072334, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8795611845550397, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325160921934, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11436852655579596, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06097518200958186, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08882028866973704, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10447731943428032, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04336580035328471, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24508499865292666, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4863315268950157, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5813030637890464, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193279464133328, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808755414383, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6619228772761525, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7209580372472328, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6706082855949119, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883340911428, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.723309466008549, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06418264300626608, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.42441200373478205, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.47268348867605026, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04977344612187883, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1699562411930267, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.67917869322214, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7295197788944552, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6557770278450932, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9043130607843415, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004025808811, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3363310448028124, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2766905260890076, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3757064665659282, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047867330889993, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2523840400749836, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.35398631689950644, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7704647803711455, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5331543929757921, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894449302314, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056070642474, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2523840432902024, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4244120152551697, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18242552922538172, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22000709146880815, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18359363071250198, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2094696943626451, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4474603115981765, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6242935265128841, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21206881397498512, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559408655211719, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3522017784002886, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6808786120374909, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3904758514984212, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24944722652978643, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846179477594556, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1907240162077536, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8255897225196938, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25386101726913596, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05834584142777327, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13892842949341902, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7017130657062042, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7839884638227216, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7994423283739513, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463118837889523, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633153293748427, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13161904600404473, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.39887464149056984, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13117321942919796, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24364244069642205, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866936700496253, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4130035764085653, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5506073600356067, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6352224381914001, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714868269842, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321733444256, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5983121923471373, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5389832160718635, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5832033512181772, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541660060006016, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8227594795682843, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.012336101446866404, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03055986234916719, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.011869120472444221, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.014227046992085393, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02245705601340959, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.016215031582041555, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07107366812029337, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07807816089791283, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.053799643108535584, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03817827499670047, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06512754720713375, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02120612029669873, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05749327664707673, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05070536480773717, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08509904476045764, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.680029257549656, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7295197779219613, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.38121957306675963, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864514334192326, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7669924707497917, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08540366965925775, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.361164731296685, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20946968078215034, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06371499414022021, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10818895548189401, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4282334117267615, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.680878617415853, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14903530861580402, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633961558582, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510839841446055, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7745833880675216, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6433293172872216, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5097643961856255, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256437719809, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142486581932, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.43590152826491607, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18713269039292024, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.29421496691261856, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238403868367404, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09467769989754392, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.035144845260584576, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10970576782807501, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027272668879708684, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15152934368688925, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.009485713862677369, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2704802359926578, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2658804736698039, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1943678302717628, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074559195521783, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2213506975080628, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4148988449445479, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.35042138843052817, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.194367824969126, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111087118822254, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5573634886913172, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18832398734461456, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.279828516330932, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2351083901677937, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123700087633785, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11838509796466323, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14463144857562163, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21933749949327822, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11757214084797071, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10484336377021905, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09739039783708713, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08632347640328214, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10856642307988171, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2173375186578632, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10894503776439336, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11838509315329179, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.40922079825024904, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3208213111770611, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10484336285800738, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368328204679, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473269108111, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.036769463847817124, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.058776558917616406, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.009783875899841142, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.014392336124373517, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01307078535904877, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06097518327580221, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.034488525841596715, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.042087727674791034, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.047602656110535185, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02096424209006638, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.052618956040364415, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.053601144556782034, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1623800308216568, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263670475371949, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2568320068512379, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.030908960240496035, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06512754883728217, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02822098585744574, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.037467510373065116, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05300977388464074, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07055959759804054, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08725224370439126, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13206614850696438, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13753247650066616, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09877259009943057, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3157359792018042, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.41111086957599763, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22405544640229874, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815649459701176, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239109386947566, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.022201229046694627, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00475519996042182, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.012053779466367804, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.004591683957496465, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02655657215475204, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11556088398491092, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20689406344909247, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07921031746884061, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0866320638030821, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1490353016857873, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09670579744588186, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08945460396786666, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04240382861570379, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0651275491114555, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966546943955, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8386797644511887, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8289388168509765, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9227612154472725, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125534615949, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.834945918203746, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.420599604586799, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12678517372517983, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.198064186490398, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2358115930380041, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4263215908014307, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027795625429521395, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.185947203860616, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09170696343821036, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0695417414382217, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07696083915282619, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3056973126980589, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19436782050051452, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12085324019757795, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18713269147737235, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291196314642, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0953494611183001, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1847675118013897, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0448479037248405, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.018689308096740666, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.039342505142431664, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8828325249089605, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9069832035356767, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9469902227751337, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7911764307030938, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210748612536, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.008251599116101349, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1634454246787896, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025371311013907175, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10374862527696964, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03817827546162763, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7371581653813888, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5660185315131206, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7620701120422216, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506535438059, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872008574908, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7592254138182879, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7008947968564783, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8929365445808477, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8994751321638701, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149074104472, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3886180094081231, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.46879064774083745, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30239109660437313, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907612767288686, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.34687309300361646, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10743746481860104, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21076628877722864, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08787644255814807, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0926877770121146, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.037750276501570174, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25832598585838185, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2200071003248128, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2568320044973509, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168780440652607, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.32423538384709844, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.32766828700559725, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12506538794394945, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3504213796855986, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16026604200450956, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1613202430507176, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.011823395455823563, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00475519996042182, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03718677711845281, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.008544330735112654, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02655657215475204, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15713685993225152, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18772760708314928, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16613355265272692, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815648695453547, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814599771661, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6197014578631489, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6460136873234914, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23722232099370685, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111085782529916, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786675704537, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4474602954009152, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.35398630747597293, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.501953128368964, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2861692573308722, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684559331442754, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04272219933045805, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11596071074501595, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12506538363812222, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07004895879176681, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07978200933569488, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6714705692288209, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6132365392743221, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.45713669537611246, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094604498307, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.551573736213543, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5312094037981132, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7424217111832666, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7759445405497107, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8000678881978203, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076632091795144, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18010666901168815, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10970576753368326, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08269734204992617, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1480471859684543, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15713684679272322, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27202455479939097, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17781087391462236, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1795305632389661, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238002969322488, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3398276327933434, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1645164570461812, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04672495988221243, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10374862765289623, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10818895768954911, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1460872484289207, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.030329260212826507, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10970578111827635, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05541279130464194, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1267851717622779, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0710736648743974, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4282334074240867, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5370414012482241, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6992544131861245, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17895589041393753, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381484761848, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15869518150117373, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.824461927744596, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.26284184436066094, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17161580282767488, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830642033648857, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11516223255747907, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11397346576619198, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2869678771793141, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033624669746841, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08977329125254774, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5832033377310201, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.47463117559865076, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5117166059295376, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512718641742, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704534075653, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6876300003010195, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5350984292293167, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.43206340583454134, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8875949114425244, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046128240748, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1112412167993658, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4054487344766392, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3191213847236, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.48438007798196636, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10230470220217511, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.021864557098215703, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09807932896325781, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.053998836727237674, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.031143832839390807, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06030763841708121, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14903529748312624, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21337717433416487, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2160115340798634, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052790279975, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2583259742390605, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1581743539508139, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4921881357175841, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6370308173203149, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033456682025, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08181271157461942, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09334687737900957, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.019271137454533245, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.029312230470319438, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.013532148831900738, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02566270550813192, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11240507623422669, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.018978036345630958, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06954174360871623, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193280186291262, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08449275562735274, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.26284183808298806, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.030908960451230098, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0956869426896004, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09877259412490441, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06903793043293828, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5832033415311151, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8080671907013173, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9238675189686615, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8316905611620661, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737917774034, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.32252599008390664, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20882358691766498, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2958398670298688, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061501821146, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2160115402057281, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2643583549836155, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4378234939188175, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1859471992631222, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1895210928844438, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3575675349261662, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3904758326836005, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13206614383005602, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3647775686465766, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08977329110966252, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1490352995281238, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.409220790127916, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8216173360752701, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3539863051527663, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806417834853982, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175709117911295, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2766905392364473, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1347759201620025, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22405545224271925, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21206879897833472, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284185744777355, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09534946427739406, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2450850171033546, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06560483267093424, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223189270981795, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10669059999162246, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.26588047014020594, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6645403066226212, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19193280056292722, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15102780429698018, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14033624866457156, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09334687929339706, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11757214440265962, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.43206338454108634, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06278920612710934, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.49414090190411103, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03890198236524614, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08850466638514291, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07921032281394072, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12002562916939653, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03271312645745915, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09203286027079656, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14903530321442177, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06418264470203146, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223189244884868, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06465348836395009, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04958902841703879, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0775176605116036, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3451052837504887, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08756384815968771, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1320661544033442, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3998116501521699, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11516223156746717, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23934933039245376, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106118768044304, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0910582843941265, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5917232703941587, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5097644102440383, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.267408166664605, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405545113025085, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360043673327715, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20561504911309764, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12506538794394945, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2509127935155793, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03718677514240097, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1613202430507176, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5370413969781282, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3593641405893155, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6636689542980183, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3839877331787098, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397069191903, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05165378401043237, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10743747035386823, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1949802230326805, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3468730921268733, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12678516910114912, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1597410190378626, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18535662042366594, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.554470465553356, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474603014550604, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1699562282615761, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.040540737138337786, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09807932655725062, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06052939154380376, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05399884223322207, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.031143831658113616, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07107366660490066, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20689406691021617, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05623634575271672, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1001722248096003, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2422056355019495, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06754669264578508, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1721718485062528, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07477004963030533, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0875638447937179, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09877258960386055, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0414622730494507, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4378234946145639, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.050330632906809204, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357958447435132, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08269734013835857, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12678516532155013, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19620941804182396, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30735801133303847, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06008664833597976, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1052105369085632, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2845760104567129, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.198064181639725, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.31742627418582475, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2553436546621817, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331225870575, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.023870833902769086, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08945460359288862, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.025957357934574057, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.047958101993197166, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10017223176954483, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05813159138751143, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07055959299732359, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.041307304667398605, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07807816194603806, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07369627158339734, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4707366129218222, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7534666613491644, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1602660340792305, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262857526333, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2254165993615569, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20817893128293707, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5486735031834596, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4726834586145301, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08663206481811501, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17384852293707923, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3486451513050262, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6627964618114457, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3056973261668548, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2885691184937827, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8736466527678716, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23091974705289972, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09073548570958347, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18126320717410946, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19314737888989136, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1789558897045107, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06632686948110816, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09534946297833227, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06164961792059204, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08389038516598119, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04995852452292293, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07585817713663487, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10374862672694508, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05520869034388873, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09170696566917755, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05184546643830607, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4513265182804645, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4339814815789988, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.41489884136668076, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2712517130558323, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883534440416, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.017986210768928135, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04724971324713042, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04977344635127597, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.021368888394979677, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421300854142159, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.620621594557311, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18359362850442143, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24944723356416024, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688112365388, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881202638054, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.29421497083210574, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1311732216854897, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3775406665253862, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27512972781543776, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660839723947102, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16667540276618992, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32423538952178593, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1431876994878729, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10230470148623637, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3684056928991848, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06278920645395282, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.042403828936412, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10447732377993724, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.060975185494442405, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06418264408140448, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06828854096116381, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20370753151486157, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.041307306749086406, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.040845718005758654, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12635334735581583, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6548947050637901, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5621765123853909, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30569731636897435, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504715079982, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300355563685187, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09009299591674354, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33807714484035334, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1955940876170141, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881264584742, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17553806979903389, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6297746286226023, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33458943290871007, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6297746209352635, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3056973122841526, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632718645526, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18010666514127208, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0528140255519219, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08151975178197146, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12852513440969696, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09602549049567183, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1001722217232285, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05223085527027779, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12336561494291055, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09739039947972584, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16885695455358338, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3380771309826738, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10230469948161712, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1356895534881951, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1112412138072058, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16995622849608097, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12002563442139341, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17667161064961392, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16132024426246547, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3208213145456894, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238002683556732, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1384617882859476, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22270013915345677, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05014425370935107, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.027585283252612974, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14128141973433658, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10818895375110121, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13028542701219806, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06705628794364667, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279540613352419, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733751046968297, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5136684639576923, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27982848948778133, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2553436380477536, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2173375208559063, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05856082926552294, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17667160762351417, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.008445626854466724, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08945460425823888, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10743746612991811, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05541278998468826, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3157359740266273, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.861071565190519, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8860265390286306, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004109380374, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918262785438, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.018475594772874165, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026963501004997007, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01717670858541034, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.008156249200285997, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03993731722432838, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05834583961838712, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08756384025326211, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12940273520208098, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08632347831463308, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08449276056406987, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.41300356554164397, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33807715081106376, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3276683035466236, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819848174119, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593274511794, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03649376886361169, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09739040377487782, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10266401053838203, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03333682414672425, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.021368885738236202, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1108555941000534, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3468730759626693, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.20055767657593038, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199280439968, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15817435669780422, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09334687803666486, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.181263215004222, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09568693830790055, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07751765725232151, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.032961244253515376, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13432105151060256, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1645164573654164, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27669051870254735, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680110427896, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0641826410739983, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6388352862707178, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5794004119176283, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6388352560218081, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445542287929, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947362655654, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6057990472016717, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5136684631748412, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4464947000563857, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011455941676, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2436424609456951, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6859494439931958, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5350984222295436, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3998116099965938, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237126592436, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631692275033, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08509904071307173, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2735743957640681, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09877258618882229, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516223438667737, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03461884016760587, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5195213303581626, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25534363563517265, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.43590153581202984, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4746311764293151, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23863890483120276, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.41679664652398757, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.42823338547831213, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25386101417601525, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291071346028, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742627892672626, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11085559743000616, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15610490782786726, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06465348852507201, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09401018458495543, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09739039903753169, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24220563654139649, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7704647885996425, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7341195249093981, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370308037189161, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.49023562811454036, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0483160736254827, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02655657139903866, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.042562732002913634, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01987071478185293, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.082697340407873, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9846346577520189, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8428631499418092, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9588471142943412, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149067795378, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689611401947, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8250265378474452, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7279754466876992, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5888891509057322, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256013266362, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7498206970601686, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.051845468453175315, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21337718233232367, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04434857928037961, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11047114662586699, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20055768179751365, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.016785491124363363, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028544152987924985, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.015723990500562935, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009340024741931024, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06371499490646634, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6566582520091332, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2974699484714712, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5175709003149204, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34334173119943545, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.19806417223797101, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6352224427049072, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.876634376703169, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5964331187473041, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237111096041, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241691458575, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06828853776257005, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.011823395064971338, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.048857778904698494, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02120611962129362, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1721718478613986, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12043880972150654, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3328523469229765, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15559098979245128, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952110237373404, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469141098368072, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.567936607429026, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7563575377753778, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6057990608406335, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218813952760726, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.710628295748554, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.33111974339248906, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16026603240596085, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2974699369144755, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.895887587784734, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.575588035195982, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7718435020399628, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7154239681422205, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8128673094841916, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754284129808, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837691475428, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08449275358778685, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.30404166194100773, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.46490157675783683, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08945460293876699, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05320620674176438, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02942357960580907, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07531230747458868, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02280263726951939, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05419873095222884, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07640767837586927, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7599387701760343, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8577681137409536, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8392075641887667, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916012015033, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7739006197852052, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5755879889358314, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2974699484714712, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5698526599535437, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3575675090684452, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310535883452, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0249877951476079, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13386749121339325, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06187598831303474, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.057071399372513924, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594721450624205, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04304284990136094, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14223189478947507, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.027795623293501787, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263670641166743, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018404890574336304, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12210386661379359, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32680832059679177, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25832597646675115, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.25164771424630333, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2925953032325942, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11047115049748732, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09401018459108083, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03126191536108638, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16344543756411586, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09301680199980882, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03978780711723618, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10374862593961436, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06632687175657778, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02315340933157891, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03817827659371946, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2005576811561284, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4436004250444295, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.455198622897653, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667161490496103, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798743917595806, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.37022539077583866, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6406358611146163, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.466845615165986, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.25832598552414054, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922079581846826, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03676946399703596, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1968261964945499, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08882029269634752, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11676401256172468, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1320661446699863, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19314737763703546, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5370413958629681, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2861692472208626, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567810789583, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206881553871998, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10230470475816099, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0346188413541546, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15817436017500516, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952109845689577, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17217185004115704, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1766716121080098, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2689414420588182, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09534946594137424, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10521053507840795, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12085323006117094, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.062331041914330816, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06656918982714473, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05964693991800891, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04115288712061932, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03622005944550337, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.030100335343229326, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2942149740808543, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10631887177862238, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05942821999781286, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575445236764, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.592666589284092, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8459424361027147, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9504109755841098, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9082930339377375, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8272706896576254, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3115315848042208, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3468730811808235, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25832596663147395, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27512972086062537, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477757299260255, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7170118639598302, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20307463541859125, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4416730251958242, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740104557735, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720487794787613, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2845760189371703, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2407745955691309, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13568954458058588, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864515166289933, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185217003487, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.761361090754894, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5156199273274973, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4493926087010804, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4320634034669176, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9856076627963387, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2583259662068332, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2186693611147085, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10743747189886545, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10374862900953426, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262874944161, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19436782598085478, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08570927584594812, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10669060229553529, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1311732207704874, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.058345840883651336, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11920292018951109, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08181271583133212, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16667539267045264, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.023689470144868215, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20497774503534533, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8958875868105675, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7476159656867416, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8300437677064342, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748649435817, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269881517748, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1943678178183983, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0536011436972634, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.26588046065327586, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08151975143290319, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13028543201541593, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.029760093808605406, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.028436034466215773, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06187598346015445, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03875619481041986, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.025371312390760112, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02220122897922175, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.040540736348142245, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02887090739348641, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.024330189653768385, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07316471817855817, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1812632071977273, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2553436445636697, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.47268346349607143, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27202457126826196, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3276682918681146, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08819004663109373, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.131173221301455, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11085559197909937, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20497774396641807, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17050800389815296, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5583269918485662, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13206615218561327, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1835936295358144, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.116764008552767, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.166675401356418, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15817435278120873, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17217185315224195, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.44167301692381034, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310233893453, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2605775669866123, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1721718561776798, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0598664224861799, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2720245666730308, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930801064670908, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1530421560981452, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22405545530993107, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4649015653264979, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27982849505697904, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121488421663, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15102780844071778, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6943026743704374, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19436782050051452, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2568319895856095, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21206880655534568, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291196314642, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5117166003777758, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2766905247660207, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5370414061487494, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073580300626502, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.46101677997934565, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1285251380114962, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8489721890523664, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3345894354681565, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570647576926336, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082939795991, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0875638468495505, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15002883166225192, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3276682996817513, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12678517186081437, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12765262787210718, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24798743177194474, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14953138272206323, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21601153182544564, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06394842084888037, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.168856950549047, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3923368480925097, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8732148276446668, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.769773232701639, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765146161177, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6884684173027108, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014172366139943344, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.010652511516038556, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.017576884850383914, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07558478528574132, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01530635554959487, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2030746249942554, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.20882358691766498, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.28457601308438424, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19012182542518236, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2160115402057281, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01219413350471357, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02865267007029879, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09807932467354606, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0390482897177472, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02350945090511069, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.41489883116445037, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3793784098088506, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4282334015703866, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.45326185463732294, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708826012057, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.041462272630610926, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02615561870080488, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11436852740564948, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792989567489076, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04977344608527131, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17328821685654652, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5832033416499481, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5964331350254715, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2295352007611083, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2479874376720046, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0484960061744463, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.056444021879725206, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.006026951903748281, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.010248601581693866, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04418332169999852, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08819004874994951, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1907240144136078, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11357958350927838, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09670579010369382, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04369106197075956, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1403362473806831, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3647775627677294, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1100878769913572, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13432105670731861, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12896330233870248, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24871662631351535, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1895210966818272, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12592277257865056, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233683527711344, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08945459869913845, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01224127588822362, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03222229635596871, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04272219914753011, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10894504067077293, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06325052271440587, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04177387797643355, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4186969263201728, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04672496014151491, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13028542345120916, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106282975481751, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14804718661973496, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13206614910494469, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22815648870502514, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124121422577371, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561504342473583, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03333682483212953, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09009299277118031, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3557748760795176, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04672495527068391, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12336562278681977, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2909808730587328, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13386749282580668, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.343341726760267, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165303483316, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220564393198385, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11596071647260094, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.045692032515130765, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05146276339786989, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09401018570196418, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0940101825348545, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3174262854023708, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.41300356440761754, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10594827847142549, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10447732424660909, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.45907614542236486, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07978201619713826, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17553806670373695, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12592276320587864, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.048496002638351056, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05089372506001484, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17217185344081157, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10302442192324374, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16344542504029652, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08035746511879721, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0414622773528674, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8267117920720105, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7279754416539773, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9276259849725723, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531509579996, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631765227505, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6926419822803608, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7634837659128509, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7138307379772676, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512048316116, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004054872157, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15713685540875008, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09602549374188184, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2213506885773338, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048023415247807, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689405735162855, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07369627714891108, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19314737683191915, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10557884153345287, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05165378268302686, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08882029186487488, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10230470133287725, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21206881010507408, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14318770956943755, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436781863268074, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.509764385296816, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17553806285360607, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27669051797978483, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14560062961525544, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06465349293073672, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0894546015705892, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7866228292642815, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.451326528608277, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.31912140456973725, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561504417878357, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004137672499, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3007455527632041, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4513265127767736, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.637030823105297, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092207859211673, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512682172068, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03173859064832857, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.038178275289611374, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04885777716487979, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07807816227453072, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07477004739606273, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07978201492985126, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08181271583133212, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0687872819595823, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.018761083162094655, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09534946613221112, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6477982197751926, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.803173786431461, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4687906219414736, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988325535028, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2782568055518643, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19806417342420013, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07864238490688037, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3311197215358464, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09073548219092803, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660839768509322, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09739039371139419, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6442251335678589, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06097518185172954, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.756357533735535, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07316471970055781, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.38676344583628014, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2365162441824134, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3647775802346118, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1289632985269772, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073659237225146, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03963884207369512, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.24364244544792485, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03817827657543468, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07107366873321685, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284184096898505, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07978201284244742, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13846178933113087, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01678549090903791, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.044018655689184685, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07751765708809585, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12336560742799771, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.025957355660066864, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09670578988702783, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19314737532651274, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.135689551752503, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5019531301670647, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2658804759317735, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3225259750885588, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1175721320786299, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092208115544763, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2227001297565736, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10743746749797146, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07004896489694319, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.040237944387062324, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08389038851710907, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8386797614998446, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6934729416222477, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8740772354351927, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8683809583143878, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7178038157865482, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2088235884663282, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.23651624405104194, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.325949521861267, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08913693227107869, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12808824154064333, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10087861714355115, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1366084056166002, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17667161827523545, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08035746260681333, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4785288495060146, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1216857527636958, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1677633439444987, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.059646942757824346, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14033625183130558, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15817435633961113, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.763483768030483, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4532618717815035, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6187804355142125, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852882686218395, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526439992841, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11085559277114501, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13753247453984596, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14706452916307133, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08819004340203927, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1766716127748542, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3090237194220892, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7592254148672917, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19314738058826697, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262793512665, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707366269995745, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10447731912247263, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06804042057225003, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.060975184226208824, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022715755659341228, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.041462277239435255, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24798744571227035, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0860158820018149, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.052814021818494865, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193278885292678, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1044773231442077, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15713684829442862, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09807932696375024, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0960254970978129, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594720303438522, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.364777569651724, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20181322054108977, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5583269652573913, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09807931774629249, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09203287028978838, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2160115323206058, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.003721708635458557, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.005301894749201639, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0027044293199265214, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.005448067973278765, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0038393947955347014, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0815197503657498, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2942149639087695, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05964694290532036, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091976125105648, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610489752120937, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1602660380499175, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6123096586710847, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14706452672094897, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2821962015389657, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707366080339853, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8714748667223706, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9227612168986506, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8774767753943442, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.9049869589297048, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8914335747745785, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5602526710451812, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8745065469421203, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5869964429771515, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800494021508, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222982617631, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4941409075240592, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5312093675350222, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3225259763873628, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3032157391218124, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814668979639, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.009303949208678317, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0075772411141054015, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02194825389097645, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030444349722370645, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.010986942521054173, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06465349023640443, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07055959830203556, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07585818205748661, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.055208686588027016, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2538610213010029, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10818895535505621, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12506538580436644, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1645164625442329, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708780926794, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07107366637554194, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6095241614574767, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18952109857349456, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3942009310461588, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033503293199, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384218965851, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13753247715449407, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5078118706515333, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04760265715437723, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995623333219842, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.030675797910812385, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4707366413657227, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5457699545476874, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9378968759366509, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.38769035882618075, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210773719991, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3191213993607494, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2436424424015571, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09268777850381534, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03635666412052847, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.064653490819391, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8820219873469802, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9707987074844977, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8360197576329752, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.895522683854142, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9291838043715926, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6406358636976673, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16344543969001285, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6442251257526096, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1379964758899306, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569733614699884, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1480471871267533, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6671476699606448, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.355774896711958, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035834772528, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132652610175483, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02489280083935899, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03622005905834994, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.008093291006881618, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04336579969875671, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01941934711113292, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.29340448839611893, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5009765605479394, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4649015741614812, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624844583321, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3048688643416971, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3665897238827359, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08882029276769632, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026759282777720342, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10894503670929614, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1066905978651883, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15713684586210097, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2674081591581039, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27512973180549427, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666037140623, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121646148615, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10052486567345835, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33458944655913153, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.300745588888594, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713685422204335, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846179209228687, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3040416793636448, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.670608278030076, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4111108623750161, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.426321590310365, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5765419739655674, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1259227688008469, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09367799725857406, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18832398943755335, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.060529389530360404, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242553491109761, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7752646933197905, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6825737130211811, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1835936326394725, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2309197558321109, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990765428898, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.46490157457590514, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6825737130211811, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25386101581026416, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1937568714770546, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2114168143059999, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27435136483622885, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5331544087014372, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.32852943628350567, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4882834209326547, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367468277059, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0025809040286248262, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.01530635445972251, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.02396202585878563, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009783875268997355, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04256273302433886, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3433417213125602, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5009765605479394, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2751297226114839, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.757076695339686, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2523840452627884, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24798743940918924, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6242935207073033, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5486734741229118, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415824893939354, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526639272581, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.715423987791089, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.814052827599711, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8723473794197174, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675342229652, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431882861669, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3345894403130363, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8852352196271853, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.40922078415631075, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615660567673, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.48047867361946783, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02953533897185307, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.020645930858367145, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.043365798682287196, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.040237944265743654, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13386748898068926, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5869964291313335, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16344543969001285, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.35398629374732715, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12168575229908228, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569733614699884, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1907240142061102, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16451645187238223, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07290026884273888, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.040237942863810695, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06632686614664851, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12678517436635747, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05070536088579937, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.050893726010294085, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.039638839137284027, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015603533213575303, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08389038939491616, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09636510632358415, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06705628474745395, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128141637674235, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07696083709134124, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.35309354785579156, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7937461968392681, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2553436431819706, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.367497247942093, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5784481720923277, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.016277461407455292, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.006957608508330746, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0012843082473623184, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.012053779466825334, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0031480704374368756, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1710611789221486, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1225232189092927, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30902369926014794, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.042722197238618864, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.030214588814827345, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6601723753323131, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2509127960530232, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1490353022957925, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101679307778665, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074559322750577, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07864237848487247, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11596071042003905, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1550784726339132, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09268777335487254, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10594828281146523, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10338595861618433, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7178037938840451, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1907240242292246, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12210387024540316, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06441766038590213, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0888202877444003, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09268777556183433, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.33285233575655443, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.031858856879935865, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.012431651112775222, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04304284756140938, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04401865369366616, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06954174364443087, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04849600040133519, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1789558996687336, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11085559418444542, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3157359630578731, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11596071369748308, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1302854198091758, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05728197610871876, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0987725827269146, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07807816242397628, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1294027241710251, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11047115045886048, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304215598916474, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.023689472195301656, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0325897420736699, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.052618954731016125, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03010033795923536, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10302443117631752, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3157359717948783, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11397345811051275, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24944723253516293, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995624682111032, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1412814204705914, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02153287861567017, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10447731502916417, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.012431651187540603, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.026056304993519692, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018833131306113263, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06512754810910015, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06656919013796757, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06754669441300219, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02832831247344853, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.058560827652699904, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04742587364500934, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12336561351619517, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.029423578790592708, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04054073815440905, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05127242203087133, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8444090090977385, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16885695311520035, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5717666184705524, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881277631244, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405547206894413, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5736784167216447, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32082131275686576, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.49804686200197756, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7272012175156564, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684620787466, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014009566581246134, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0456920329930522, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.048857780681966965, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02585877674107066, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02002344029685899, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.142709139071213, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10932481921295001, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5156199168468167, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.155590987455784, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866936984968505, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13477592050125506, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1841798507073207, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27669052835229146, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263670931513624, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12336561427705346, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.043854563649093424, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2337063397681973, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.014503580281461407, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.055617613780672676, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05623634683688607, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.034229319322866526, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08389039054927032, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05340333287668101, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.053009768589573104, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07531230500553528, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0729002689757056, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09009299689283526, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.007149102011428538, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.054399318067815526, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03732688745553151, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.016785490900389537, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.043691059167156585, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.009522485476927373, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.00793799395817816, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.046378208478239154, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20946969534891194, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2643583701854095, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09334687186206443, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2658804749420943, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10194652123002705, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0920328652699032, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33285234712438333, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19314738612835125, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596072222712706, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804687760139105, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.33285235422834747, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12765261815863566, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22678362354928158, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711645366678, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074557466734625, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2056150529040479, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4921881183807294, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4455295313084324, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907614470139746, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.45713672745226047, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.054198733112676936, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2568320093266548, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1329642418367418, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16451645609917864, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692566362167, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.44552954295550146, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1001722212628393, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.35756752091367366, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829881253628118, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922079320533705, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8140528170652275, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7556370006731536, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9544779932121036, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224402399222, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307638702271, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04115288758410097, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19559406808128485, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08093671278997923, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09739039411428387, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11476477871433864, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0413073035912617, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.018905445552244573, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08064661835479273, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009412589602362435, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.010448625745114985, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8558511473252645, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8327813339891187, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8832359839438259, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358530070692, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643597527355, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1200256393807427, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6001883437973046, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1233656151865789, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516223260683443, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12252321393161818, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4397473335944505, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2523840467925765, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11357958853901089, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.40356686346426535, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135067667077227, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9390248194676284, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8860265423404338, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9791955095425979, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416397864328, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840420900219, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14706452606200776, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16559311743562713, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3593641352100755, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12678517683435636, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455985758028, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5467381451956814, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8872046053375798, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8962513674700037, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122914426919, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014734018949763, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1320661477211273, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.49804686903891465, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17328820779598494, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09807933216355501, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22815650666626336, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2674081753121162, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05877655597781075, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2751297163914212, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12421300951226172, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.27982851027647926, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12002563450796275, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0753123091178224, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06418264450635729, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12940273645488687, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09807932616569273, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09401018294656463, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0894546025831515, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04434857961575062, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1666753967288457, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06754669014080195, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2337063566368153, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12085323625992021, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21206880790789254, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509127876924548, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.31912137531520635, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13028542362289536, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13660839879754036, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6842640181872902, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116393459287, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.237929908066139, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12506538164501302, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.48633152422640585, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.36658975002427663, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1907240166684244, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1755380758977278, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12294379195752321, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.23651624405104194, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2120688052195621, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2330075134905935, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3548800993915584, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0994702141970832, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4130035642926274, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09947020488496514, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07585818113835564, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09602549631421495, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7563575461877984, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7779753380996163, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8444090117275512, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.821044093928524, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6270381507692535, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09401017929973156, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16995623066792817, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13799647921388533, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11008787886273608, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.25091278032458536, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08035746091495455, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03185885673979036, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010091315272280356, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03044435084646187, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01987071523385903, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18242552898947542, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10302442379224229, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12808823947107117, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18242553239840353, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08882028806027263, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.21933749659333648, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.29098087242222376, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1422318899921336, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16398024004969045, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451645383840033, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04177387939938602, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06097518582163417, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10194651993666308, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06255972815462615, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07585817937126191, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6909763042096638, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.36840570342912393, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4513265095898076, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203546169772, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026792625292, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2925952739294426, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.38861802101939075, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7146280317864998, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16667540137248368, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510838454582955, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.038756194012248855, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03622005905834994, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0069306719565742905, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009708476566425138, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03138043076787506, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.39420094979476256, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11357958303762707, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07696083649831482, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601153878674959, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.35577488164568133, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04434858066121445, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07369627238635497, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0875638487358914, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0490396190323897, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14223188806160622, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.020567095925468206, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02546808190020633, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.006192990526982975, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009340024600591789, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.028220985999796635, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2186693778192481, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7446563459996459, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8615382018615033, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548581757184, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476532148739, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.011508149238556782, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07316472298837703, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.007846238782286796, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0021997981188564006, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.019050898832782846, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14318770431729216, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.23934934632216195, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18359363047858832, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937838555966913, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2893717124637451, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.013795364014087909, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.025565213379803393, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04084571640356988, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.00831577901894803, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.016215031498718366, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17781086207059793, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12506538821919855, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13846179488655896, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07423137098019363, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.142231880425859, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.008511302700089332, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.006930671626557598, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.015723990720871453, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0037362205668347607, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.004331501830548968, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2523840444565773, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2553436345374145, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0656048326473596, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337716505365228, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.048136770362863894, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14608724261673384, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15713685057656243, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3293917081603228, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.031143831268997196, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.038178275549542076, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06097518144411574, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.23231015123924134, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.059866416502654674, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.019050898665462734, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575278439349, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15507848219957543, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14223188858570734, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10970576995876362, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08093671433836258, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16776334505008653, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08389038875098866, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22953521925859757, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0815197537954087, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06608537317566954, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04451442861375948, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3849121599738037, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.795022277495991, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.47657965515622097, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165159563561, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526535254755, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1571368478687646, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2925953220113264, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22270013988498238, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.195594078455348, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203602897456, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05707139842720544, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08329192795956629, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15974101930247178, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0750407200236922, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814056184001673, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.027169230498059933, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.044348579624261704, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11085559332359163, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02546808226936481, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07558478077967759, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.49218811491608183, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3468730970589257, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2814056005892906, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237018228317, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242552284237612, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2814056046025696, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2240554639618365, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2553436558030236, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2043419059190331, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12765261751381263, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3557748688284663, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4282333997567522, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6601723741280022, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646048236331, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.45713673964221924, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17441027796633296, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02002344081310921, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.038178275711979445, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0888202929055101, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.060307632291997856, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.47657964630850025, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7745833851504809, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6001883350957882, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601401062121, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324824658669, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5039061476796184, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19436782122630222, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.575588007031821, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.620621609957643, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421301087726434, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.00305151012797917, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.006930671626557598, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0037948339193419733, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0037362205668347607, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.004331501830548968, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17328820398007735, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4416730050606239, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.511716594725156, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16238002401448112, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17610412693274186, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.27982850609161614, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3593641512763388, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23792990336713143, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1389284249148848, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22270013653861911, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.034358688032151065, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08756383985486633, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.019568676821857454, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.019643761026202508, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17781087046458555, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04885778101800598, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08632347628391883, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.974434788035595, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.024987793449838546, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07263670432493079, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.23370634606036045, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4726834800581398, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15203224957635694, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309316170495, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1285251271468155, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06979491863157242, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12506538691753183, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03649376751018872, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1847675050037572, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1460872453091135, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3451052838778332, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5477060089291581, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16667539296274334, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.269710141292564, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4035668651992639, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02315340933723184, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14608725082175766, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03461883909101606, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.031858856126753855, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02595735646905307, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3904758266102798, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.292595309497282, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.48633152969693133, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583986160086945, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18359364005999823, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.041152885496494714, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00934002439908321, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.004248079445186411, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03010033575277447, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0024438865600090553, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22067816331145548, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12808824004472324, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.17667161394274633, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181321827610937, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20817893574706697, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1163617719566744, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2465333376051654, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03904828946529562, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1520322459249004, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08122775863664032, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13386748357739833, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.020410306703242568, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01711089047478384, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.028114056296913516, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.018617801326144448, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.33111973539690376, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25386100429388386, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.418696921561847, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22000710163064227, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.41679664924853815, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1824255253291146, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3504213723121259, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25386101345538886, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12002562937635354, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14033624762244148, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.078078164886264, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18242552755402736, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4359015210725666, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776334890272462, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18476750110228973, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12002563578023707, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15203224564254667, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23510838918347807, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23934933930833083, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15713685414124837, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04038906825742198, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14318769964391767, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07640768320790968, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07723878084320634, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08329192700655437, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.6825737308439439, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6057990617633404, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2523840518043966, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408956355492, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.026155618822644732, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0530097698578119, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0677931379777811, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.023689471712378247, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0780781610017613, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05749327901188097, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10669059806089891, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06681232490028681, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06903792897868426, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05623634729447621, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5448014085968099, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.45326186419931425, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7534666605026501, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106119246147347, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224298836102, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04637820473087467, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0427221944206837, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01784873735440922, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1490352934492752, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.011552671320876746, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04742587239489459, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08945460324849475, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.108945038377831, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.013848611023352225, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09670578469228257, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5409238392656327, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.27048023783677094, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5746334771456261, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13477590962518382, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2056150398877604, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1015894492537793, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07921031989341994, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.037467510035967676, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15152935033282255, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1677633472506686, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4571367302479083, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8714748679817677, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.9804313231088617, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180156720463, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203442380025, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18184364635442138, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.31237002342829523, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3629692036920446, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10411241303576933, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091976450236426, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3486451403306872, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1403362580843833, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21011726604146536, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669054024883266, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689659801034, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.34334175071798945, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.23370635465679238, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14608725497969463, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1968262081991762, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064393195301, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07159120093145388, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08787643426911311, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.029312232267230606, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08151975595431929, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.047780070380139185, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8587185806218903, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6495786211445337, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3090237030634627, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233683878567566, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.49414089533286737, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19682620232714285, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3812195791955098, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6513548599548368, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814840942197, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891438694615, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.46295861736925686, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0627892051469907, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0641826414063455, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05728197093926702, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2005576754846521, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10743747194026938, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04352814298273277, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06187598485572171, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.048496003286977146, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04867656967102877, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16451646264021436, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14033625250550985, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.30569731802124295, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09670578996667444, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13523207864303707, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.800067891609116, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6424324788067629, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5312093781285115, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240769549964, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.33633102998524744, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04501553100095206, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.24077460582954577, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03704716868380644, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.041462275339081964, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434190290963597, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1480471946181245, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22135069731024754, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11757213545684239, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16451644984187638, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723665712808, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5650587477893183, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7310585952384661, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.888372003152826, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.32939172062356786, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658974161730645, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1451153568873659, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07751765368666984, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0566524244901695, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074557503384536, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11676401587960224, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.178955890975982, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10017222648614425, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2814056030525779, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2200070968193156, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237068373486, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22815650401617957, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2114168277479511, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23440664760487262, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18359362331925239, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121957425318564, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07807816123776841, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09877258932519417, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.061649623138883884, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.059210252684634354, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12940273884700002, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.028436034320688065, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07807816038294475, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.030214588852742308, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06278920703025156, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02790137665870679, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4282333807682022, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10230470631582318, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21733751776397797, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2120688015036228, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23792988930822928, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0067712097892571824, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.00784623913357939, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.001304506709515684, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03126191439806911, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.00429793857857261, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18594720433795026, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10818895301091115, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.37570647541254865, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.21011726572488423, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10932482378153109, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1403362486943084, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16238002168134189, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08389038654595474, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07316472101140671, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013981339713, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17781087127419404, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.808672312750658, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3415824918333435, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982112738724, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7779753224004671, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.900529789428974, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7924642546196474, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7641884197187775, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448014095403524, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8812065923823555, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02315340933723184, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14608725082175766, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.00978387547040816, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01826427776791539, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.029090756326807944, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.015967654018136154, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.007785655090344926, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0019723356106926826, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.004297938889852703, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.017045316631140627, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14608724468871365, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4263215917603302, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.42250463591190734, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798744010347373, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541660840729283, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.049589024485246734, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03789242765806725, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1993080130486978, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559407672332, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337717657131294, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2958398710309522, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3557748802390649, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10970577474738569, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09467770141011718, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185096899928, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.31573598145020804, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.057918090055605276, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09334687553405036, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434190339288838, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2056150560775014, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7310585495332277, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6297746165644269, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4571367260846988, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757645992309391, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5954925591629211, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36296918369581876, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5945512671166361, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1955940805488359, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3629691988578188, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.12421300368673543, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10158944464894466, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04958902356504377, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0474258718708058, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559407740582677, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07423136664447696, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0656048358425033, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0453525784477645, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0614240394812222, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.033844033585081465, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0632505252338613, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.049589026193982, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08850466368461003, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.26740817018470725, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516223237666288, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.027272669490225016, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06632686946651664, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19868535637980728, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.22953520110461498, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487213746099, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3998116597948214, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.018833130355588368, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09467770384403609, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07978201457094665, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07263671006337252, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.015603533971208327, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.057071397467897314, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.585101154064009, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5019531108398511, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.18832398019741176, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06465349067530844, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.364777559860252, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19498022084391667, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2925953043139628, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660839473016517, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.33025516642686426, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06394842319807834, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03993731526611711, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09073548602003995, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03333682538406786, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04922211643815716, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19559408091469965, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.24220563841082213, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07004895971384167, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669051984822124, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946969048225197, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.528290064329331, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8316905590096738, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.34070450009172, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015078637142, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882834080309882, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0812277521427774, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16451645855006927, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05856082401097754, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10970577126418382, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18952109838289907, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05877655806105242, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08632347628391883, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04336579995585337, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0204103077447562, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05707139983650839, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04146227480964763, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.039195128682252244, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08882028494887803, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09602549176872564, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08151974999767142, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04569203302966486, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026056304369646316, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.031618768081755094, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08509904151382575, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.028220988155719315, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03846619145424154, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06656918831381274, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01578456156204954, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0641826411573087, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03904829409935959, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.073696276879014, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03861092954193782, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07751765565246145, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.030792164595802255, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05856082686554336, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014392336722692085, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.024330189327882862, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0034296037076125266, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.010652511450976787, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06348235593711622, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05300977027751168, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0644176655218192, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0832919291994809, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06730107839062419, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05877655882540819, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24364245708481522, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6315942910122365, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.36116472371146113, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03993731567778807, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331543875503562, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.29098087316332916, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14414885939462252, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19930800191095374, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1907240266937815, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237117453638, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.22270014458941426, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16344544404251196, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1871326903391045, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559407744072632, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333872888121, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5058591103988311, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6334102511707069, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1677633443874689, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792990532943453, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2925953165617689, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.014615669464029788, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13251456711933066, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2018132162705481, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509127916073285, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.105948278140824, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05500528774617115, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.008985428686101348, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05419873057545651, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08389038304830165, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024987794673563976, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05070536410305868, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.027585282639562208, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03541073001648795, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436781452590285, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.040540736441222955, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09268778317843832, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09602549015294491, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09138210695563939, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14804719080884, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14903530803554874, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07290026951506988, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.012241275921862823, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06394841801293873, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08006925837915656, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.028870906735024026, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15817435405506322, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05707140091486633, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.014559519626612966, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08725224762018893, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1623800356048101, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03676946281284838, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2583259734926897, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.29098085375009336, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02800752210765109, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.038756197706439705, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12168575391054709, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05665242536601786, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.23370634583730307, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09138210623203041, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07807816351263212, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15507848012258815, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13206614647105694, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14414885010657358, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07133200236809616, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608724793916625, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.26740816244505694, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.240774589795666, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16667538905218465, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14706453177607917, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.18952109840454778, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06804042465954772, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.14463143963057243, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08663206815575948, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16830944582092308, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07159120408994114, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5448013867972088, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3056973102758328, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2628418519675263, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22135067999588529, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523331779798, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07263670990960924, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1175721388648333, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07423137072014678, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.055823143717072476, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451644583017075, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14414885840078645, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2674081622792134, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10338597039637529, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08509904084420944, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06418264479527169, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16344542480471572, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18713268012733217, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24508501188543608, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051908708388, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757213462404653, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.050893719232851284, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.070559599878992, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19072402685693443, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17217185555063141, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11757213965218458, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06052938831826741, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07921031989341994, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04099902689180125, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1398656467195204, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1375324724494835, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.035410728107107964, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.018546564341339892, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.03904828829220991, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.029535338049422155, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02112519356884855, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.013689477594194869, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06142404036780128, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0680404208983164, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.007665874537789094, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024798161597673306, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1267851742642701, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.26894145134589975, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2227001393064658, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.156104905539994, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333890197302, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07211220182146888, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.019719126292585334, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.054600605921163226, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08449276082871672, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04569202909643787, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3539862915375987, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6486889362277423, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6859494403352498, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291191323285, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606817096345004, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14223189306362083, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.45132651291203424, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0397878101946661, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6967842433156818, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.48340453644469655, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.024145423137279756, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02748069393209859, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06278920951112192, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.053403332925533, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.019568676291575108, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10052486277891495, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16026603529685285, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18832399066757133, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.026255301254798597, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1097057695648288, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.004503272735546869, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06142404036780128, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.042562732110314014, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.009303948374722, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03173859082020869, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14223188534505693, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.17441027028155195, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10017221764421501, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1980641694372485, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10158945033604556, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.019568674887631806, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1520322558982572, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11676401504721187, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.028652668031594157, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09009299774609991, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06394842060290609, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05340333375642503, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05051766968268257, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.029423579846646234, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0646534881299474, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05261895450324295, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0946777048597776, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07531230439570745, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0605293884108693, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13939639027586942, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4960938398246146, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7416740255247903, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7711548556945508, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881357703466, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195412923059, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.023599297777600954, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.21337717491273708, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07369627516100503, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.04336580079355191, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1441488555817541, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15713685364680646, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2043419031468336, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2068940597548922, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2024431682053394, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2068940606265919, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9213576195850345, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9069831909343785, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8705972720561892, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513716949966, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.910545394438545, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16451645230671635, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5679366016702104, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849538091574, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118682556774, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17106118288044764, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02460992819113597, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.24944724813061372, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894558713795, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06097518070894057, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.04813676879453435, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.010611421329778374, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.10087862418652353, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08819004374732214, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.013742321057948328, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07921031880253065, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1361483216451679, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08882029177839658, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03846619668334544, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.009974921609939175, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4016878061219657, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.46490156806497696, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5078118812033329, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.46879062302035246, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061689266978, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1081889550876912, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.35220178915524175, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.32252598323889303, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331264063312, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328820481830198, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06853749555928888, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1561048955095198, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09670579210758247, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03488088945318529, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06656918542295401, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05460060675519891, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03963883853995425, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18126320726137554, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07159120024378922, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.055412796439379144, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09602549145131656, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2101172616881183, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.11201595514945599, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2845760097072656, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15559099373589713, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.15102780650560405, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25683199999677925, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5717666128683946, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610489771727298, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3157359721273053, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12765261879180012, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04922211326736236, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1059482766600327, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128141715295514, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0625597288822217, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12252321275984725, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13753247708565394, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0546006043809462, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10818895944997481, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.060975183571876854, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11124121185441983, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.24364246035057863, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18359362422681877, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.25312183076912903, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897357974077, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0568615518280473, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.05964694097796632, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16885695987985497, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16451645526666525, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024237633371039992, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11838509341369917, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3123700249240595, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21469140911809748, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.13753247563512094, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1778108774977568, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.25832597650762046, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06828853886833142, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1859471934576072, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33458942676703235, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.29746994104734126, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05419873117788161, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.048136771779895594, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09268777573276211, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669053403287347, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06560483670246224, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.32423539162930687, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.18713269039292024, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08819004221870536, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687308039739906, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09467769989754392, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06233103769423321, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03358950831390814, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07477004769460055, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798744293941935, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06632687161883077, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.332852345639486, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11279540006907031, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04995852215352868, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0987725863901353, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421496719468077, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.0335895082292891, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06142403800708055, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12506538658830832, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2407746008651206, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10894503972134728, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.02887090905281728, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.024892803238789108, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09807933054338856, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.022802636344176258, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091976533449923, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16559311627634749, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1515293464763835, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19193279685578266, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.17217185980808622, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08509904070153364, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.054802593184647606, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.15817435374768532, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.12984343133685283, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12043880814940318, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04672495601583351, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4902356279202538, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.868826776794025, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7563575578441284, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.46879061235407243, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548595057944, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4282334060047132, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.25832598027375653, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.33633103999585495, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206215923017864, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2674081535278094, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.41300357193093995, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5669778176930524, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07237401623892643, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052801145453, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378235139417255, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.033336825879522004, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08725224284045491, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09401018498842371, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.10411240556013736, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13072868685608113, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.007999754460493466, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.07640768434590957, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04161779274522845, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01406362728430538, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.06097518674896927, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.34687307293187775, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.22000709707362098, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4130035863289713, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567956986156, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.401687806325171, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10302442649831939, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12294379720730732, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01979477982141912, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11716747127929517, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08787644424424128, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.022629200087417478, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.016090874549456378, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.01724277664575687, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.005533388002242318, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.023509452226958, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16776334255689693, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11516224033415542, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.2782567951766199, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253802540607, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.32252599375199087, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.12506538481657722, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06418264069676524, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.04272219667755519, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.020023439663718456, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.051653785773715925, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03690806795532124, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.16667540764915822, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06681232800144773, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12168575804512372, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.17553807177488934, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5136684643508007, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.31405053301241415, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.842345095773147, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995737070605, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7924642649544856, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18832398292724303, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.13206615309039343, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1192029174129566, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08570927570799158, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05707139957368672, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.016979992139895643, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03622006041405638, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.010944578317822345, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.003824483827027668, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.01840489084215889, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.13386749591912217, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.33111974590212123, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09203285802476414, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.106690590814209, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.28457601263115606, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.031026179860801775, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0394904036250735, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.017375665169515025, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.01840489091002874, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.043691060430423416, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.17895590489339894, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3157359794632318, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.1623800279747445, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.33111974093113744, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.29910518452125057, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1352320755982787, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.32252600125842634, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.34158249995765544, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11676401864026842, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357959176868757, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.20561504631525707, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5175708937955067, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5448014093678416, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526618619132, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.35220178282848225, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.8459424381123668, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7325918345732223, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.8587185866712995, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976953025067081, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804387866188, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.28298813654148475, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3363310505849187, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.26284184475842265, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653335732897294, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284185277277705, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.08540366975644736, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.19132769273787958, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.13846179634565353, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.09268778245753283, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0792103197960812, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.021948255133708617, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.034618839209629604, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.005001672503573349, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.004718369261013236, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0033244367172826374, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03554439896410239, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09467769802096528, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.07316472108510741, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03904829187993395, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.08151975828372145, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5851011412233647, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.6731916570731415, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.5698526609268576, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.44360041335786954, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013916196093, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.36477755181564775, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.49023561313595515, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.27048021681193535, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4282333805313125, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.7512833910356504, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16132022903417315, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03448852341760984, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0847954053319519, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510838412499357, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0797820187173466, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.259825649396885, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.11201596017276037, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.14223189108784293, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.06465349121329719, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09467770480354985, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.09670578951136155, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.03358950828229638, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15152934426999154, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516223603733214, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.02645577818476829, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06325052417394764, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06255972947795976, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.309023714459953, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.08093671099227887, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.10302442412800183, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.19930801444643065, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.7341195172756602, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6976089055144132, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011556727124, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.684264015950271, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3942009293213062, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.8376199562146425, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.6548947144876512, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.1666754017032478, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.35220177405679753, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.06348236028655997, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10818895782024673, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.15507848097656643, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.05813159360309974, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.0758581759488746, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.42632159952519905, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.23792989696424371, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0424038286758469, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3504213775395547, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.024798162261063926, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.5727227869598561, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.754191528598023, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.7779753207476178, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.42250464208011984, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.46587345428729504, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.01634012763032922, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.08632347442299283, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0764076779159181, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.02615561982158148, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05379964112839021, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05541279048649454, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.12940273636936384, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.038756194909264706, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.03635666085200937, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.020332353053928737, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10017222559137764, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.02120612029461623, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06325052816008742, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.15304215343880437, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.07290026954186717, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.29259529614025637, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.4863315219055661, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.25832596861443186, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.0973903953790999, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641443230681, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3593641409592756, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3775406867220169, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.32680831363527363, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.700894814291387, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291185894685, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11516223396046718, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.24077460369339843, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.16344543048852125, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2018132229962308, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.2479874361288614, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7490872119869955, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.598312203383528, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.4407099332748001, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111086868866564, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324820310564, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.3090236999019636, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2735743894568276, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.19806416750650194, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.31069437555991064, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.29098085490893905, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.7090191334613359, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.49804686458820413, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.759225411893055, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384263149225, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527903780576, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.03501262783920278, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.28616926195762066, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.21076629756712584, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279540158369517, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.1710611851035119, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.32766829149661525, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.5832033416499481, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3665897397569866, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.12592277620754008, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.39047584645493955, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.018761083428529314, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.09739039674005494, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.026255300743831235, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07030384328506352, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.03527754851012629, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.2538610134282009, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3775406867220169, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.43782348938719806, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.6662796715871645, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730034673395, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.016721142229987267, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0389019815966655, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.0052608522824287825, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.038610929420527074, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.09501304458550618, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.18359362862591194, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.04146227615435998, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.05108273629549683, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.2043419166919658, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660840185565792, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.24220562767163553, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.10594828296870885, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.18713268821257154, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033440418386, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364246110486312, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.16344542665739756, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.06512754881024996, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.09401018265505036, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.035012628421578075, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05165378517789484, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.4282333884802706, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.036220060208176086, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.08913693443335344, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.4244119910371958, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.05014424915073125, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.05184546652062029, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.008348054439148486, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.012288597086884387, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.004848533015128272, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.007431772928480712, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.10447731720474766, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.026056303610701607, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.017780389226092864, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.027376489216235107, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.046899260226012346, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.11676400723242215, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.0670562895110844, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.06853748973335652, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.07081619694839195, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.04689926295118442, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.07081619580488699, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.3720487839985232, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.3380771273400633, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651622846617135, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.15253650854311773, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.14033624775221526, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.1650540903277886, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.39140593446236305, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.22884513695270767, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9145963371877369, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.1694058683736672, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.2068940547631557, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.28298812837022413, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.16505408405905608, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.25534364097578, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_500_ft_llama", "target_model": "llama", "recognition_score": 0.9102267104968432, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_500_ft_llama", "target_model": "human", "recognition_score": 0.9676556691797809, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_500_ft_llama", "target_model": "claude", "recognition_score": 0.921074121162329, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_500_ft_llama", "target_model": "gpt4", "recognition_score": 0.7512833897734964, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_500_ft_llama", "target_model": "gpt35", "recognition_score": 0.9175985079693455, "ground_truth": 0}]