[{"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8998277754516503, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681129305996, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8615382070180898, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950981716087, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099547108605, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9046505393656534, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7813306204089635, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8354835442325449, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846483852173, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744676524457, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8104789002574955, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8652240792269095, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6740504753158401, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792100861421, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056142488285, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9149009599384217, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9445872058863943, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8697145706611523, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.919063285366736, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9525741308573683, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9246876921962062, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.96641049221741, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.942081910741279, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9621075716409918, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9111797079885746, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8799743753443962, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8661325083649123, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.939913350900279, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737799770375, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.872347379692754, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7772998626467326, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9005297896298636, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8606036246564295, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898520151194, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253968236831, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8679338519605144, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8887587806148456, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7839884716914692, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673109680915, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933306340277, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8615382148959334, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6842640201200784, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7918210590315736, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743666810328, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9496693681887158, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8499711796845445, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8606036242846111, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148292628797, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575412161556, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430409506831, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8749346133772866, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8104789001426502, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8233283865245565, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437615471291, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772359655581, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7563575370301817, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8872046035206215, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8221891296092547, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388276857483, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163712421724, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8807970783322825, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9496693671535474, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942195077386, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086178941660832, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9518632331639021, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7943849544364198, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8848377615822047, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8407825984950341, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467676547539, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972680111459, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8499711709293422, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8459424324398805, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8740772359367482, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267846626074, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.842863155099694, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.862467527571453, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059313782487, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5078118792844802, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059213778563, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127529217361, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9032942108112771, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8044059110913679, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8092759786348263, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942049009461, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.816406381516814, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867799642567, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185763316392, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7217432120068258, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748623656439, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204109359078, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.917893373745859, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8766343842664845, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9046505356767476, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672151378033, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068737200139, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7606506603258355, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8407825978746416, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7634837603404858, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148242510823, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256486319912, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8925625264155154, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.946990227111847, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.899827770091308, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094029750237, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9465966692492073, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437514434175, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8633916049613503, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8289388259945503, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419877744632, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245950516484, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9252299513865633, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8104788951925429, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6460136886403909, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.774583403851713, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646899567038, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8895288606795614, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8740772280154193, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8418256562894136, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891351583456, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625378120873, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9066531247009835, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8289388086567349, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.912436158275545, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070129634665, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9207896794755565, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6315942850243825, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7690802546559434, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7008948205737254, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672055983719, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9437636523315245, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8774767852521423, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159587626702, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7090191428309691, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587958473124, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441164233291, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6242935043430867, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.77594455085242, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6774740189211832, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791933307732, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819745344469, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8864204150462085, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8428631459065935, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8397339719631349, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767852000933, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8887587826281217, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675302464077, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9005297917588404, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799928933902582, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.894051721158551, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760250753103, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9079671364256278, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9092645200297798, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9449947176401167, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9618217224440541, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9713473321075111, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7154239931213764, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.474631172759741, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6370308011264527, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.709019134787688, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601240592279, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9730365000147392, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9822877012425021, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9817357218886431, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9666631735028451, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9851575823344132, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8333245957993586, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9437636512919029, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8679338440236731, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677469894904, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.91789336802898, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7799929127300493, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7826624859344686, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8056321664044037, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982222300418, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916122626701, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7813306142370909, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.822189137545897, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757869863042566, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191367512667, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423079902466, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8652240744209926, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.713830738260751, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.702530048678845, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528169794722, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445451865833, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8519528122108035, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545678236094, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7690802427885788, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702683676828, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760163526373, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.689305601935717, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8221891180306498, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7325918226860865, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.754914985981852, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191471439329, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185943978724412, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7386690805629751, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7577943675711849, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740064063378, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.685949440340023, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8019358218325386, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6169358158698339, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849606761778, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506684011176, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819940519597, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.838679759676369, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9284088047918192, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9053223003483101, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419648971077, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179839381163, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8848377663430707, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.794384962789496, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8723473828912652, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210614974127, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354706869706, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7341195294012588, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8499711805753611, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8175744743759036, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9207896787844969, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9026095989771766, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8438950979768963, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9046505379397279, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8289388181226232, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067207943092, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.847967761399492, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6859494422916962, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300602494118, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5869964342620301, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746263382253, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852884209517815, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7676898453640869, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7994423174518486, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7892337172957653, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872044257986, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493105311264, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9525741297556791, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9529258213113136, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9485372346686768, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9757623657075043, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377730358903, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9367494726389809, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9257686332470262, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9385759614814931, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9469902285295442, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9496693668461013, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7634837590890063, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8840392826565003, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849567995539, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867852303589, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545591649797, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8344068900355083, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.900529790071326, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9268352812834915, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.868826785655212, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418188115864, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.954984466471875, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9178933646016675, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.934395162925047, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9294404053234562, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819133748882, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879311951981097, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8322366481316908, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104788924323569, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.822189127083655, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762845882952, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867748929193, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6976089073435441, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.821044096298751, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423098062069, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389865074842, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6893056270509315, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6893055980557434, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9130583389763678, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746104839685, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647787192758, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9032942108836585, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8933094015262993, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9532750418111208, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.928408798568228, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9339146243308696, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9367494701009282, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.900529790071326, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7090191316820471, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283852264108, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382083336574, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9190632907689382, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8633916067265419, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9079671352344877, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619354043218, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933701460955, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9257686296724974, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8998277719764112, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9196425311762432, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424314251963, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.924687694004417, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7416740157122004, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8056321825782248, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7520125693788372, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307423500586, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964354604418, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9111797082690326, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8902942229564474, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7295197703446271, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179828592281, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632915089107, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9241418184653338, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9294404002324842, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9026095984015654, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361549060875, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425319690296, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9890976258687564, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9876638994769343, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9666631735812964, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.988038901065738, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9828232895649583, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8596637470333812, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9099070041091974, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8723473844844987, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210707384875, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672108754573, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8947894583004683, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6976089163610741, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879311989044824, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837940641603, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047122453356, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7505527637017513, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9086178967976314, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215289879461, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.709019125994145, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743703320739, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673186188182, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9059898180776956, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9149009616882909, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473815819018, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748646866235, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8397339730063188, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185944022204099, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.791821060685658, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094022359154, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689512061174, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7476159507763608, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9257686311044117, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8548846394072537, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210587943791, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743736897795, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675417539123, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7041601269344622, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7170118982043384, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228435222977, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467730813579, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8104789124635468, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672162246113, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.839733975145148, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254060666566, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9485372344890596, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675285981528, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744807809266, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490872114687498, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833766538228, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.685949441928734, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8940517181774721, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9507778821591087, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9334308089095914, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894585491761, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.958226123215953, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8418256477404085, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8697145819818212, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933094102152911, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026096013824291, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9381240125813851, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185944125348691, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8568122970395261, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7813306463954744, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.83114303876793, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527927954445, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9019206757768401, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8895288524963549, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9092645125059474, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228324747505, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343844331927, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9039745065610852, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8895288508992925, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148380537279, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619170291395, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104788925166083, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.940353061555049, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.90260960545625, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104789082519943, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511463155518, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366563780752, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8714748632666028, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8856314733189203, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.882427864492817, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.879974371995827, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063804498617, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7956581003970201, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8895288497660726, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7106282871811076, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085849581014, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354721816098, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.860603622571267, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8221891264916891, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8947894626296017, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835485375187, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511464528145, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8354835436160017, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8140528013595489, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215259212213, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581498187839, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.767689837284169, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8670357605129617, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.687629993502579, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8558511469409806, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918338387325, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094674345694, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8991213892344668, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9066531228533334, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8670357537223838, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581455617418, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8933094034701325, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526321376795, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.837619963845763, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8244619352480336, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759634691994, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185738129545, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8548846418692635, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9496693691457972, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9761291664517174, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297897555898, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942038743316, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431679996339606, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9155072461569338, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8697145772427735, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.868826771894821, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578448885693, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7853085851025622, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8670357460577666, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9124361511658405, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797514097197, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511509474213, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6406358512935649, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7233094566115388, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672228449031, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956580932411755, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240048316495, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8895288541483714, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8278281584477157, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.844921534873121, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.862467524390562, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797795703034, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5755880010267871, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7416740156891509, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6671476568454197, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324810164287, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4960938405402976, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8116760143975655, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085677049947, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7563575522241203, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339815922508, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191400514797, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673201391919, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.857768110768767, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998683222392, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228321596338, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.837619968182579, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8278281550900537, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6842640257373896, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849465874236, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.835483552278315, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.841825651689513, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8688267750437916, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9263037275949243, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9105453962283964, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952932213691, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970796965305, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8558511415831492, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8848377581120944, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7248702740402697, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441050060822, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366425813243, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8895288528472741, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9362850049586035, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8940517124251405, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9381240147839853, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755776307745, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6909762903892325, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6976089093640429, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7325918380658952, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700990832274, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175065063332, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9111797063888116, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9742394398783646, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9099070060838941, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392852474067, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951015176429, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163800853695, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545682356095, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7057850414480317, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082848991892, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239865996143, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7563575546254564, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8449215384300371, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5621764911627603, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786832399288, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837687209167, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8925625220658716, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8991213751517351, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8233283884557627, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846414595287, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631507580449, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8397339718199223, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8289388132986922, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8925625287768251, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867823772961, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723726097412, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9788748053940184, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9683812354499195, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9746286903143673, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.979035759450252, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9697854094488744, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8397339669440442, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8976952947560143, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8539127515618467, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681156994525, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.911809955566239, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437726882828, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8705972627495824, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8615382074163245, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473603878827, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916154785061, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8749346215839506, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9092645131182847, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9390248175016442, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9700134931595389, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9353465070761949, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6842640215296778, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8344068863066599, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5698526588032249, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063725511793, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.705785025476493, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7476159775284978, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7839884738922945, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7401743619661748, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800918311975, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646043417866, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9294404015302238, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8333246003979166, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7106282984363518, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357556715684, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9111797076466022, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.96691402198757, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9629528311329616, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8925625215184385, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053222902323251, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9726235111566918, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9026096038095817, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8509646941288821, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8529354671597849, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493158925128, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825978633253, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7943849531470167, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526388805605, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7201714939078668, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.826711793176398, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245930552944, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8255897197829903, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7248702864187915, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8198933396459668, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432212063577, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358432325668, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5544704494836681, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7057850383436379, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8187367975312773, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.40733341112808974, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.29098086572462856, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9416541602144456, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9005297937294686, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9235923176332439, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104462640644, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299522157718, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9492946372539581, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8984105624401028, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9329437099306107, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9207896748256277, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9724147184306293, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6992544093090022, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8918110383075829, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7401743438177558, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891301783144, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936454947898, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8499711760952228, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9339146263188468, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9184802455993574, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080732782685, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933419154136, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.909264517088571, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8969755714152714, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9136765211071184, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898104717289, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110403367308, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8615382053048996, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.713830738260751, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.743167996908814, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528169794722, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059419226418, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8955226838368738, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9252299536427211, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9079671360742981, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675277302061, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179877859217, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8732148223133409, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545608147414, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7690802411534444, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159615827603, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951007837772, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6460136942917318, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159473346631, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7248702835797634, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.789233700300877, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528056400596, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.3106943867819604, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5506073689908234, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6740504667825116, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389867659236, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.661922852268082, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9012274116520764, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8872045976995926, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8714748660797074, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898123526029, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549558839584, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7918210712534967, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9219218366255315, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8807970792997017, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677548065813, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673097843412, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8187367929809943, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9053222985007494, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9376689595531473, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297880330169, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894672734905, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9477691452930168, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8509646974027402, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.93343080929347, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583443987713, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324819914614, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9155072459056219, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9289263320162864, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8991213798515506, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916127211756, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059542743898, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437583254974, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.865224074137285, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587844127964, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361526536577, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.879974373334597, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9124361598983461, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8558511486877528, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9504109752956155, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837531492676, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306297658019, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9603611599624492, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9790357589956473, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9706877692107926, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9324533029540223, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9759464451854426, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.969555648732157, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9909447355874579, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.966410490704421, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9748211563013263, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9549844656487187, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8840392841330608, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.89912137566525, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8652240769663274, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581000734216, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933346851092, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8679338444088969, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233283863841337, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8539127457754956, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299933137322, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942128426511, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7170118866671574, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8407826083617839, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7295197700192267, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897129647538, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125703552022, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8376199761865142, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8895288524963549, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8311430436580025, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228324747505, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343844331927, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437653113556, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8428631443430389, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.795658083777295, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036153963132, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583331098897, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9005297889876829, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9412234432892962, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8918110474126943, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970824415692, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.903294214261229, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8670357524204252, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9005297935383951, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8783142449407161, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179877774729, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418241660393, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8714748617097908, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.795658087761093, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8344068787373073, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359939799577, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325119614323, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8998277861639478, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9445872076008026, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9314625052717105, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267739401705, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037265703934, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8479677528783419, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9465966699661312, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9309620686885992, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748665493378, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105454029083708, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867781652735, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7401743420589377, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7074046870800156, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434996392807, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358238744507, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.848972189676145, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339698821833, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8068526270949452, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070017278262, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489722003203336, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6723317233250422, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7866228100885486, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8438951020237625, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528023125941, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.660172372076222, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7620701134062915, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8558511499801357, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8221891265246095, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359825096867, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772274847688, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8774767924351867, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8489721916529034, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799929064614181, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.851952808869902, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872046033804102, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9309620723089134, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9536217936251391, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9643214463656099, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970610342836, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9278877996935256, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8824278743392117, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.867035771394508, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8925625256626192, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149068453708, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9149009566054649, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5292634007106017, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324887134669, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7813306289959975, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936412527651, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935457382386, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7248702729867746, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6893055980557434, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8615382169360469, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746104839685, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352796606541, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8697145741919226, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9118099503850537, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672044892545, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274067098841, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9284087999446287, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7264256100121663, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.874077236029327, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799929061835401, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424388675444, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743636541719, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9453993937516381, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9353465080716605, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757869950871295, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587854240138, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942078461059, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8856314664189877, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.893309402372116, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8679338486634529, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637500501964, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677562877856, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7310585852756736, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6187804270337424, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6654105625547946, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352811048335, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056210019068, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8679338477150991, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117906504853, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210440999511126, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337069100497, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9092645171780722, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8596637461698584, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9273632951048933, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9441768598753949, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473851949262, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9111797095241667, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185944030295772, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8056321825782248, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7185943885023361, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432110801709, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680046851009, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8688267822133793, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8783142510103631, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163718130967, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.902609598942758, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891241340564, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163762539676, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7732163618019389, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8864204196503451, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085861785344, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846424161235, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9207896800849671, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7122321887517398, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8740772324758554, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526210292518, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9124361533619708, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8529354803723999, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8418256434184155, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7122321957555882, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.782662477408919, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253716822379, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8509647015823095, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9219218368348017, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8322366541310576, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240887510586, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080722310453, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8104789136586971, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7520125690877459, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7676898444003712, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278605986585, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416397726746, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7648916039404072, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8723473836581571, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8221891229734182, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068774334353, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063651733013, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.884039287282258, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9399133521393145, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9390248164588167, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743667997095, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876919594018, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8080672013338955, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.75779435905592, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6740504691166272, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762816489675, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239976798444, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9111796996290568, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9394706112901186, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.825589733232714, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9299510347807537, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625262709581, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9761291656684098, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.973443427273044, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9719924772383781, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9702399048544693, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418241008422, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867660749791, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.891811041467447, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7606506578326456, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849573661274, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026700775555, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7956581076196824, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9066531252524466, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.880797077068377, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884570724299, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527971288996, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8757869846008765, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9059898117144825, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9504109739961347, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9092645112292584, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9348724515089607, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8757870000414432, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8568122924126511, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9124361648971397, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338461572238, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9224823454608271, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8244619323671935, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7839884748377378, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8386797635785205, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869845704818, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283947451677, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8365545595459999, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8697145742074984, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8799743649659663, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802444658794, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343760480533, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8615382101278238, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9246876914286055, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8749346212306112, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009581456908, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297839386351, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.887984045770597, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8006920003238446, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7905303016874788, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085863345098, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760131925556, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8344068797047979, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7676898465615076, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7634837697820052, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494451403396, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754286452103, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8267117932940224, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.831143051616655, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.791821066127301, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891286510014, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063683847457, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8397339684984045, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8824278601671355, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637433419858, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872046021688578, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869924565721, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228331530768, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7264256100391007, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7233094606478798, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059061546449, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583504044731, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8643104513705497, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.896251379027679, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215303751383, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338557440303, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743641091188, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8652240682559402, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7956581058856809, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7931059433529033, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096098567943, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918366230515, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6057990755004661, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424324854527476, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7074046825722372, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321852719344, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918395530352, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.762070095634454, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8056321774833713, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587917000858, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142457073047, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681116104978, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437622971885, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8376199644783399, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8267117969598629, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283891010902, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755644788749, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9582261189156519, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9390248157703304, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9273632956093206, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.909907004718857, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343859725697, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7759445282876694, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8289388176512846, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159529456167, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.846957838035057, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185778308457, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8568122892207347, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7008948174210028, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8918110431186623, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366547137375, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281512366895, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8816148976025541, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.851952801179977, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8783142471227992, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505344264342, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767960577022, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8824278626539847, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8670357576177494, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9241418196072099, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737835390038, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549618889237, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9118099553030397, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9399133497801481, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637496505504, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9136765205320848, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122159762622, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8643104575080505, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.801935821353164, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159517427599, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110437705287, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311906837817, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8902942321682672, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8848377615455104, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8774767989471148, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213738454575, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423252751225, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8984105527809609, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.804405913837354, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8807970761175175, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339674919825, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.782662480818301, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7648916056421793, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185943920778335, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7386690790612912, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122901055307, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336962293495, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8633916063636259, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9111797164259797, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8856314741925966, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9294404014924587, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297893524208, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6424324782111999, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7505527629403508, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.501953117452213, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947191170246, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658975200001626, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9579122701075347, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9324533009419841, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.891811048352718, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179836621591, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267835604088, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9155072513364143, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8998277785227685, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587939652166, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9645892698426132, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743778026707, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7461389780647293, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7549149906671182, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7563575485482589, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995846310338, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.738669079832599, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7106282779790203, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7122321974341655, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8577681142117651, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748686841791, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068957931374, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7264256186176804, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.756357553546891, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.756357559886399, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278623416767, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068864103621, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7201714952424639, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760145647964, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998573771618, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759771528152, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760186739, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082797210788, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117945107877, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6584174973336229, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339702971263, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215404658994, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9603611591982854, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.934872450468532, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9190632871201354, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9207896744296954, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9485372356721498, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.903974511702334, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9130583340588893, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.83761996562256, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354670100373, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245953431668, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303069310248, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8344068834165667, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6370308125884826, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754386573721, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392905406881, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8031737922225273, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117976608774, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6723316928878211, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624913216409, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964391141566, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8499711749153632, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8164063709610624, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867654551899, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.750552748997412, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059030751876, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9492946360457196, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9073122171211561, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9381240107012888, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.948154533505225, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425375046744, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8044059168437818, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8969755650732417, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8766343814073025, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9257686316160999, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354759068004, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.830043758163607, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.899121383508118, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8783142486662138, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110490129084, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891258402785, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8397339617684483, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.665410567454403, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7606506613909705, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299915005603, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666561366978, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.936285000825241, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9235923179351161, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8872046021132001, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797079870297, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206764283624, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892336972190274, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7718435053381661, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7931059409887201, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.692641993266152, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476638916056, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6723316976417902, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7956581060907408, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9012274112212791, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585713531942, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.858718592252807, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673134222035, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9039745059451586, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104788997041404, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587864683568, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760088818546, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8879840487784935, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760189787996, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8816149003404486, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.824461935494684, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920002131741, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8577681105440305, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9184802448800499, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7994423305175207, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056073462944, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631479802633, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9309620681956757, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8255897251450536, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8499711762964309, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972702264833, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.925768633736773, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.867933856735028, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159612679015, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104789023917435, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748648843101, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9155072462625415, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7943849615379062, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8289388084918767, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7826624940951401, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307446634251, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506691245758, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7325918403109591, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8407825910393151, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.638835272500555, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.842863139619575, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307409499083, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8092759759744339, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8783142452136241, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7416740276523507, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545571384341, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222962802079, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7592254059297582, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8418256411956138, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8233283886031707, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407826049562245, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.877476783983733, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7264256097569943, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8128673143739029, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6976089205759374, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036124228318, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210534246121, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9046505387740656, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8428631481426645, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9118099567474324, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.939470609363367, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104530813296, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8998277761754158, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.854884638556746, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7853085661771182, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437644488612, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867876722675, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9441768586571055, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8887587849314249, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215311622039, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053223008328911, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228258465151, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7356416275305251, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7592253939811502, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148271885404, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956580997326083, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673118051563, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7341195273331578, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6132365580506414, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5136684856414029, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995790599459, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646045861275, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.944994715962884, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681105904855, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9155072466638511, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009541844895, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.93146250660788, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8925625228179607, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8872046035206215, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8856314751325872, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213801573111, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936520773109, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9167080690511513, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9066531231715149, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8289388197376434, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.938575960193933, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894622960896, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8633916082519594, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.875786993387891, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210441028020518, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9136765257756252, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.649578626464551, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9492946362078875, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.96641049267423, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9353465094433451, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.950041476060626, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9518632318912792, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7704647921263728, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7866228137821838, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6723317091144877, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.729519768425564, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894723824096, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8832359911785206, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8479677483130239, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587909686134, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489722009833617, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.852935470440479, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8044058979370425, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6976089163610741, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849585820371, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152325027221621, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774739843775702, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.896975566918767, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.911179709812425, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9079671404033394, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354722356738, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118813645395, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5292633794130042, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7279754268659345, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6315942930234665, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633938667177, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030979767209, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8840392837618755, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9252299511076831, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8705972711318621, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797645723469, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122935273331, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.781330628611297, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7799929084283559, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8856314770651622, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681077057183, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.865224078228625, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9155072403091458, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9019206700491275, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8940517189538422, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377655248922, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070038118361, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7956580934280675, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7918210593785715, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942412152854, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526271547659, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837549199014, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8887587854961106, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9213576209640209, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637576305766, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392850674833, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199746815952, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.810478919952065, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8670357548687155, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8539127574474733, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125675417848, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.896975574625017, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036240426947, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424324854622013, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6688802687349713, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256486660602, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366182409198, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9289263272179575, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9420819129406275, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8783142565232802, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388219160853, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9257686257264951, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.875786984064628, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8128673180921598, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581328751309, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195222160897, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.874934620905776, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8519528210755841, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7520125670192918, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6352224266555536, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.851952812910124, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307348999051, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9358173610701868, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8210440957265056, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.894051719694882, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759587236688, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053223007369008, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7341195227824047, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059468524706, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006919866731977, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867800524853, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998537633793, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228340125271, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9202179875356441, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8661325149637812, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681158353001, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.894051717720949, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.667147662619165, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8539127521625547, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6513548834243778, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631529441262, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253988258035, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7154240030057077, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7446563636972371, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.832236652989346, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804229663857, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197686613454, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7577943802136166, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300553801235, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8044059228159565, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185739941815, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228287857834, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142468495763, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8558511486877528, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8221891247797709, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283813248301, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952992044155, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8438951031817385, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545612419073, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8548846304741159, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545661453063, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277748508205, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6039318316646982, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.702530053985433, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5467381518960183, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990657308305, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544080683503, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9343951608866135, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526238674459, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.878314243150014, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333246023597477, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797626269794, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9566342024475992, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9643214468291275, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8807970811431596, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067233364374, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9651191115682095, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8688267714118225, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9184802477014236, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8807970755718021, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942276738974, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840499103678, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7154240011555741, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7041601326171055, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7839884794942058, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059433202374, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416341892286, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8902942280733613, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7981867759276413, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006919956550592, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215233714932, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.84897219653881, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8198933388429758, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8633915999500795, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163639382121, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359814179092, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665990802781, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8732148371619062, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8840392862210333, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7233094808529763, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148326866778, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545664213043, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7786493069186927, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6442251373788428, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5583269660370407, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898446408489, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746333128451, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7264256123408381, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026853917347, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490872012107727, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366617332353, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059205362656, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6842640298572963, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.692641988046994, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6150878463823485, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983121811818364, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352795150951, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8469578377315546, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9263037222867572, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9278878000808416, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104483864379, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872046032636665, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489721993203283, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7122321933399967, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7759445337719911, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943001335717, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300560032318, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489722016474518, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8606036174619208, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.806852625511346, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148253847514, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9092645108024796, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.919642530471396, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7943849517140881, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7892336972691372, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587909447529, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359865165619, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9362850047380298, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8679338465718988, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8615382167230081, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036160762737, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228691743095, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8740772267466678, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.891811043304029, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8278281480960951, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894705174504, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.889528849184087, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8529354736018087, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8509646892014987, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672036802162, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281479727922, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646930141854, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437629965687, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8092759821949405, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7520125634665122, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744724413666, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.791821059425252, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9805806538548014, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9763105283361667, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9500414772896056, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9709092416909465, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9594592618969385, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9066531243572536, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9278877971180944, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9445872087698677, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9711290927528073, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392863641319, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.752012570214899, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8548846426400625, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8918110431416374, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517159546335, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105541665114, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7041601268208397, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.771843510086872, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6926419841793185, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837653322435, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476664930736, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9190632869500895, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9489172622558483, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8175744673042957, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9339146218663057, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743644749924, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7969253804937821, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744807418612, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7969253686891941, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094760256067, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762904283493, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.76207010119399, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9263037225960767, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8376199709982912, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849460714312, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578362485163, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8688267729370108, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8044059176902209, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148370361488, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325036905476, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388157918732, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867884217363, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7592253928651048, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637439828737, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461390016433782, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213815087489, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8615382151031414, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9124361597526495, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9532750411790903, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026096011359458, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9149009562353086, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489722018548447, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8887587833954008, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.850964695767996, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424433949204, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104570101758, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8955226730239602, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.903974520575938, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9190632933167703, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9219218317147965, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149059479801, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9543079690222867, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9820137900631611, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933094067479966, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625221068343, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.966914023507141, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9130583425992398, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8697145809019322, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8311430536208088, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094056003378, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321958975294, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8670357508723902, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8732148317426873, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8832359967420428, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9477691442973394, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9026095990508278, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9012274157688228, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8955226815155595, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9111797077951149, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797063533986, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9268352783976203, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8344068780634011, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185944051135872, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8255897180999915, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876300059434728, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527591648886, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152324873052137, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.945399393519822, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9012274053935916, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531191740119, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916077289353, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673147633135, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8376199657479194, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8289388123382823, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191271983387, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972703667616, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7371581516195664, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9246876939169314, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7592254037828615, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835425084797, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.901227411887209, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.649578640934133, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7248702794720957, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210440947794417, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358489098675, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311943641446, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8438950893090094, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9489172606108099, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6740504991432196, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.740174356112953, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338500558377, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.897695291028375, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8749346151984582, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8824278626050628, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9661559678549775, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9458012719714319, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5428632784117449, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6057990522363914, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8624675276289814, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998642358522, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672068861422, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797506369943, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8092759759822878, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7310585590814027, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199631184434, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721951328055, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867854486094, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7956580944172758, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163671381237, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643646751462, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506612539164, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8558511437907531, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9099070018709855, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7577943776496836, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737904924926, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324805722332, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9207896774382779, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7866228280054136, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.903974508756577, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283886005914, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.762070099252775, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6859494594317018, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.700894799512896, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7853085816663425, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898558721091, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891192482814, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8596637555487977, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8210441084818284, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8300437675249017, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748656097494, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339650400444, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7371581494389348, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8925625196647059, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7745833989665898, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.757794373431387, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.795658098239787, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7662936331316224, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8489722003832237, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7786492947379758, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437534325978, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846425902179, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9623913624352813, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.990140144897106, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.967899292486577, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9674102565279088, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9496693652504595, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5983121952111594, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6224593246113134, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5039061611996365, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942286673168, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.596433119523999, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228018424778, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8757869919040558, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324938504624, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994422987925857, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833847124981, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8925625291094601, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117971381129, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.927887800947527, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637504765029, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637493090091, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8244619334489436, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8774767897864754, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9304582567860074, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511453133806, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528112041906, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8376199667865002, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8128673147348113, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.858718576571537, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.879146772653961, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998592976901, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5097643634518499, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7534666656938409, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7956580892604296, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704648023569308, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802433864962, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8289388038953629, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8757869919040558, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9012274129348329, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849560411116, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240799397499, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431680163586597, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.919063292657962, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519528027983254, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430603940116, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677695453688, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9092645160538836, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8479677483130239, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8068526164616694, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846340367979, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9149009580671237, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7786493083681201, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.743168006763596, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490871995582933, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324600073662, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544194722933, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.887204599945285, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760075198693, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9358173525351556, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509646970846914, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942165617258, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8887587767995858, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8529354694486211, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8479677599561514, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840455622375, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517204553425, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8879840483323349, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8489721982322044, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7505527660730207, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.842863142157526, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338543640482, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.724870279718646, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5926666002012747, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7839884788662415, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950942056781, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880090282125, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9706877688893863, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7745833965075475, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9202179853886062, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9536217904050728, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325164201633, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.933914623458897, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9549844676520168, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9525741309159699, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755640819689, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9504109747604289, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8766343661747918, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8198933415693512, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8418256473399034, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933685598549, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.911809952645947, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9092645162916317, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8840392854580522, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8539127549293796, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700914326766, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240899344557, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9173026547786065, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8824278635525279, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8278281430326363, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300424620523, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036218406639, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7620700923960965, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8783142499813464, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8044059217567958, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528103607201, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104556289651, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8558511513581681, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8910549588711992, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8244619279859866, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321777635851, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675250577867, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8652240785691602, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8187367986614319, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6132365712150556, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951024767309, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.752012563718145, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6671476770838007, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7401743519761174, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7310585727582132, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303063666174, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191193669683, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7918210728044366, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.567936617617036, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7461389867367219, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943865479926, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690734047581, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6352224416269138, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7310585598212653, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5640984818709517, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197651273548, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073735011362, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185944067718201, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5964331191246923, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581417864503, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804199331273, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149891862444, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8548846407276883, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.907312222585778, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8824278615496782, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267833264716, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359875478912, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9656413103602429, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8918110387783375, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8740772317341152, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110454621967, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437112123742, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9563089435017673, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8799743735210962, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8840392924697739, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9532750420231358, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933711214621, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8643104485361854, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7356416267490428, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6636689515720152, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675335184154, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105503992951, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7994423065282329, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8092759704187091, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8438950985693119, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228217979934, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677522605324, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8848377799661243, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233284139162236, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8322366512021685, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201715006282111, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935381441304, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8056322064514472, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8697145819818212, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9161096112167557, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972676228528, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646982130247, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7008948115910015, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7981867859784164, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6388352923417194, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526577176103, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672063001993, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9597620564376209, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9579122708890077, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9713473306396688, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9445872046297151, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528102771267, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.723309473054522, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085626014428, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8740772249975699, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148261459182, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311971648759, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8864204051627035, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7154239821774485, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.845942447491843, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.920217987960161, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105453968683134, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9053222950025732, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8643104559167127, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9059898151220014, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506686233885, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.764891603523465, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8519528098042248, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8128673180921598, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.767689847426861, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.74908721887495, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.832236652878318, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9059898169699967, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9149009559031479, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006919824876466, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9536217919387187, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110338138205, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8365545899063374, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185904416457, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942197737034, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672066077452, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494514221869, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9314625109856881, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9026096055788988, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757869883180075, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338526943844, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632963852139, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7461389897338067, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7662936552413766, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.887984036791321, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228340655561, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631466445468, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9515039987678792, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9372107959413785, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6513548703141208, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9420819124456286, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9637799425846859, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8740772289379093, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545561085846, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9184802465738018, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382158464908, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.904650535621845, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8807970800215287, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8688267773089792, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9504109760361539, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9367494793021705, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907200427633, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.687629985324046, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5851011700935581, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7505527624310379, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239929079834, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506756804184, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.658417490485124, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026806904141, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6842640316599443, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583013027054, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549150024352171, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8428631490221108, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8006920128989379, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8289388241861737, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254159349766, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9394706151450183, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8333245991473848, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8539127585796656, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7138307481212045, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737149212128, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082911932848, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7279754359293273, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998594995688, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9207896828290736, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.746138999198902, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951068138034, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.47463116196602884, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8187367928213298, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5888891279361435, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.537041406846985, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056151539722, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5794003916645043, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8019358233657315, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7759445396926686, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737097834065, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743527519341, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.942928597623261, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9118099580295138, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8984105492245357, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9207896806550239, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891172689755, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437627633134, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7577943700498688, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.863391602762848, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840396249569, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672071099073, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8824278689382515, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8998277710681482, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9086178914520924, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549444344252, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765210199842, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.766293645902429, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6150878329048718, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6791787042486799, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.767689842352143, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239944589237, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.88403928022607, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9136765166665146, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7994423128717834, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631370200096, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.759225402303875, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7505527618426007, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.873214824644255, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8479677539300183, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288489290379, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631504180634, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9713473312911924, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9445872074671455, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9334308109805107, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9645892727126745, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9559813469064801, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6976089197677691, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9202179833441073, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8624675268528325, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179856214588, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711797860219, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8947894708871824, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8962513780894417, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519528198012701, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392786972183, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122225002199, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8469578570019706, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9073122219249181, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8233284137509762, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104506539376, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933701323176, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9299510339445334, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526147395403, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519528198317662, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526177725698, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527965110445, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8615382009856285, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.839733968164469, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8300437716546555, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.867933858029854, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744762389359, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.600188355641534, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7648916119591376, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7918210681753558, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948049913363, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358334513943, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8289388135365312, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.887984046970943, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8606036150679978, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127457538401, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767893106331, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9664104932058248, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9367494791997125, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9732407155217295, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.970464660818447, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222975978206, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8255897148495572, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.805632171110322, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7606506409866315, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125857923934, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.63703076847487, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7577943570675416, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7704647962085145, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8267117911218439, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690695483674, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825992024016, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059554523008, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8832359904184487, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8832359885977838, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897149196113, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267742507099, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152324912962944, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8661325097629528, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8832359830145219, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.796925368235359, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846406952586, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.866132508674646, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8255897301381456, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8116760178095542, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850250651584, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677584761335, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6893056040492145, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8596637526640878, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672064231456, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324945699733, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748567181901, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8895288545670625, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9005297945385611, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7786493157981127, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.838679758911754, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9334308112018347, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.926303728617732, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9339146272260433, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9690910394194032, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9390248181619432, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9477691423977029, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9838471655570045, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.976669232919418, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9843363517131669, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9778834105444476, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9734434270155022, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8558511469935784, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9155072461569338, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8714748649214098, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.78133063934579, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9324533039756742, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8661325055191003, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7969253440366374, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416338452668, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424467876412, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601487843815, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7264256091597306, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7549149899135801, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5234203434044123, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677532531626, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407826030943527, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152324939123463, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059556912476, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8333245979577752, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117885835833, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943661821399, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431679997740013, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.817574476888594, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7386690709550231, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578441199229, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366566264656, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7634837612199554, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7170118663424929, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718435000523265, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357631530147, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835474200487, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.837619972438842, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8469578518152557, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8670357515773989, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.804405920398129, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759747647857, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7008948150791393, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8633916132746537, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631440393172, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104559471403, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759709544658, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8221891207164342, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8044059347626533, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431679959367616, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.886420412119378, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789099810445, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8962513720660974, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8344068881131048, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8289388041081673, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392866670621, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303294232284, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185943916954649, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6959583460932632, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9268352844876366, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846280178939, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145665561371, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8740772288083208, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8019358124356765, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8322366441555463, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.896251381889733, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916160023176, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9744347870775458, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9858276341524301, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.966155968510476, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9793540687938124, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9748211556709955, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.874934615221676, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8783142513979629, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942356750733, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671391683669, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.86793384543106, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7648916201668736, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545660670544, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8300437577805795, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511420913437, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388134463801, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8925625343271255, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7620701047180533, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7592253902327445, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942287327257, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825870185297, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8418256456880807, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6388352679434334, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9086178931969461, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215304135861, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096137411802, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8925625249126439, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8714748631389652, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7704647983127436, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835461422119, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744633675501, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8116760081533758, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7866228357884513, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7154240042431953, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995911762398, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673148566187, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8984105497635977, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9372107917145271, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.93902481745751, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185797572299, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096103480177, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7853085786666205, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5467381555498536, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7520125589208199, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936572511495, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.840782602229185, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8175744665269583, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8740772295705668, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8848377661733141, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389814614189, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549635780399, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8187367935979188, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8499711755087599, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9073122268499674, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942288226487, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127587753521, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6169358242933783, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7401743519761174, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8376199745367646, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149955357229, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004176490605, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8723473734454844, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9190632844876189, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8872045855702816, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127574749422, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582537623405, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8902942249811745, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8766343801071825, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8278281509637982, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8955226735075971, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117919651347, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8418256648031122, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8548846297759115, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8661325077520843, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.771843482879399, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434855865727, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7106282890738665, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8633916086866766, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.866132502072466, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434901767649, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601349456865, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6424324564378823, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8354835522931063, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7090191185860464, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366602004474, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787087327269, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8019358294867346, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9130583335664538, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8548846373248301, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9532750430944986, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876960982124, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303392670531, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8519528163304894, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8714748577639044, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549560832518, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059214941579, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867826412787, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7520125750940144, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8509646988476829, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388240125506, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631505527909, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8587185689005946, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7520125514738187, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.660172399993948, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325105740518, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936444234014, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8643104557913146, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8210441018371043, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163629757118, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767877133074, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059410165724, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303122559298, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8824278698317826, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.838679760729538, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624697293588, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047064435817, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210441135503243, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8459424382844181, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672068153734, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675298445862, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.773216377123021, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673228873251, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5813030720908449, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6406358618870739, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224408799584, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743533442344, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142423946221, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8723473809336798, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8816148977745192, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325075586022, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646913935109, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6406358473936797, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9458012715954397, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104789034046233, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506439512766, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366476032849, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7759445343869598, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.731058564318498, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6893056105430525, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.66714766867273, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.830043763194712, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036149893048, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.817574466627073, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7786493126839472, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9219218383935147, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867736655174, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9656413099652559, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9149009517544305, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9046505380771158, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9073122224124123, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8887587852215486, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7217432148712518, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8774767823191466, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.712232185079089, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191117728432, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825960579817, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8879840463652626, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.891054948520016, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8872045989789925, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297882200561, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210440943142927, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8031737839497772, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8311430495745019, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.87831424465447, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256412266063, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647842611061, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6057990566114408, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8428631454488987, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5175708750564927, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122118142831, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011770227009, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8221891236402287, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8006920060218672, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.83867977121929, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772257453925, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846384779661, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6636689589548515, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117962920235, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6808786184888453, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253627308313, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240012766548, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5234203489519834, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6261241841609513, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8244619348118278, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.85966374390896, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159462641034, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9079671339524403, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8910549552246437, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.925768635833949, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970788991324, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110412907412, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.925768633402468, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9149009517544305, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9252299526521908, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9600626842510779, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107906956856, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.935346511684572, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8210440957265056, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9376689617939865, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.882427859868533, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9433475795702837, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9790357590689276, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9618217244143049, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9700134955747992, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9656413106249028, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9702399046487289, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8955226874588458, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9412234446081909, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9299510394754256, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206715233861, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425329150318, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9086178975435668, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8449215254713547, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8962513700273341, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9173026630503289, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338476545625, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9314625100679264, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9339146270013887, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9202179847881843, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9462003530242533, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9149009573439943, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9219218365653138, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9348724543514947, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9353465166667707, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9522199350767516, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765310879137, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8175744723276165, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7662936653968161, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7662936423109021, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743436587245, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690735589878, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.903974509005215, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233283941264058, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8376199728199554, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430379489413, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765290472959, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9124361543887952, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9367494752875726, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9522199322722047, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9656413101895581, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819124056108, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5486734853776779, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7041601196251432, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6187804250037412, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191479998198, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.546738136627397, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.880797077288121, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9643214460530596, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8791467735516164, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.952219933288469, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377741161172, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8006919888696752, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8519528172688023, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8175744763809284, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224327130996, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578439127656, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8539127565037924, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9263037321592904, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006920019161928, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891377201046, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.889528853820243, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6187804590570066, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7106282909787092, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416314781146, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056408870438, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832125325056, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7201714908034446, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6671476634142514, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.585101178011838, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317036427755, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876300004702441, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8104789044419084, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159602383103, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7969253720754564, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972781639881, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867792471826, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5888891261304098, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7057850186817324, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6460136857153997, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358216552608, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526641108681, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9529258189359707, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.935817357324322, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9190632898131509, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9726235096861151, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9416541612660602, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9367494744698857, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9289263304607328, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8864204122400182, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.945399397258204, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816148967199566, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879311943177133, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085808002893, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.870597269401709, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802387125806, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185874333557, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.778649311518437, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8354835458639724, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.917893365697301, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267730019756, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122882371315, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8548846375239559, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.942928602427569, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879311847245788, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359936853517, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872046042209338, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.605799051300752, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.715423991886515, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7170118622891177, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307346537741, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311867183675, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059427040014, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085784362016, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8044059225578921, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324796678054, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646025964915, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059410645562, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7295197873152259, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6477982227721651, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094643225046, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620700962837563, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8104788977154841, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7879311994100113, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.727975436791453, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253702393413, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.835483541588366, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8969755789559734, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8864204145337425, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8856314708170738, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346161623623, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846380687015, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8104789071027056, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7799928987776861, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7634837607388193, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312047116827, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245945109771, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8056321977159572, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7401743495728174, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8509647100329014, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837512481579, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434873969121, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7233094720745803, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8449215336662088, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672079339749, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082755899496, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366536327167, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7217432034385215, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8344068828856402, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7853085861375407, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358671153698, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358134376164, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8221891304358876, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8164063780586837, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7745833856792047, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797528612823, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549551056816, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5409238491264765, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7386690870724769, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6706082807638807, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619351098367, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512573725303, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8221891372133309, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7356416548959605, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7025300643616396, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026633293865, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689436716314, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7772998520251835, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7745833875996776, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8697145808222817, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619397077069, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666549220939, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8267117942427843, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7676898494848097, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7592254062915916, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175075785161, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.749087210225939, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6671476789986331, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117962920235, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7233094663267015, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191391489696, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102631521769, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9309620727451242, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9433475767323783, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9235923271251728, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531165525178, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.921921838835838, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7356416313946791, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8955226811934934, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8606036159379633, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370308025481487, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897263519498, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6842640191388053, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8469578365261693, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757869867213741, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942131110061, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392810884475, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7233094660632298, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185943886378986, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7563575435721094, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136936298648, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321787964987, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9840936083627551, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9715639663278101, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9834704421466678, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9861513894540105, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9795114464184901, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7264255941827434, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7386690635342626, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7577943855440452, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148211887784, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321977304696, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9787126474903328, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9569571474104881, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.981453434988712, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9744347862680789, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9381240165508298, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9278878021681349, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9515039950547075, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8840392783420984, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9518632302832942, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274083158429, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.750552757955457, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9111797125590791, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210441047588385, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359869145799, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357501559905, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6548947529512472, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185943852349641, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5888891250047753, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519859527150747, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.649578606780193, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8031737822733107, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6688802619794466, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5794003910909317, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367906082283, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891308132522, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8244619322574347, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9284088021637538, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.887204600711949, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767898383491, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972703411865, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7592254185463024, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7356416548959605, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7106282976683483, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631443423404, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689436716314, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7592253996436574, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7201715004026695, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8092759763989726, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267780405976, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288512381374, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9403530586131567, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9385759587422576, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9257686336145238, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583404928811, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.931959573567751, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163627841221, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7264256067506311, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8479677549582887, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802415220788, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.891811040949501, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673235364354, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8198933364596068, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8679338572279321, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581025567078, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.841825650306499, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9840936085348628, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.971779013293004, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9788748066577948, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9780517436629896, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.946596666551036, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797657380765, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185820810026, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519528126048597, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240862616453, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278626269078, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431680150373585, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7905303086203004, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519528051495083, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867852723997, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.837619975874114, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8910549532306937, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9588471149372251, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9178933681318376, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105517700328, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9473810441532773, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6113819933459054, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7416740149221527, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7386690796482435, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878309975345, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.684264023937728, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.798186778086794, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6774740104020225, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8976952961150189, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802379090086, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637324556632, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9445872011393148, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9661559678640911, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.950777882717242, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.927363295318452, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.958847113561636, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6825737273766752, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.729519773963001, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5409238496928321, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324782363527, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563558903778, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.808067202498783, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7994423134601367, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7905303090526354, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.814052793370338, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.800691993117373, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666632470741, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8044059069367769, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672126008922, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786231556071, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916174680946, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8539127478509577, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681160677239, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7931059361965072, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894680669838, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288568586932, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6261241830498226, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7008948172113771, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7008948106287232, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998645601823, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125553058804, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6926419932723505, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8679338413502321, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148253869785, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846356073532, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9026096028264302, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675272170539, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9184802457522845, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9252299499151188, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053222934661762, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.839733964652416, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6169358194899307, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6001883332294019, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6791786885689927, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299810646168, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416298670578, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.78133061137426, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8824278722881463, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6959583118674295, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970787959944, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528125721762, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8459424357067229, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7138307255831497, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8955226751693337, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288561132264, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253772095028, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.786622841527695, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431679960191697, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8376199697164646, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.770464790229611, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948052640535, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9473810474726487, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9184802508568526, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9594592590971353, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.855851144497999, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745068663491, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6113819903403322, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7325918451361799, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4921881422802026, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046863439434, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633150914754436, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5888891455293724, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6206216005887883, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.45713671560135405, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666052775217, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358686299722, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9059898175613194, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7074046936033636, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8723473800532734, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343873910633, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760139157512, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9005297900459482, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9441768603334355, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9603611610604763, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9496693694649748, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9403530597152505, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9213576199812713, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9407897488916996, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8918110416624218, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142453146149, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226789386904, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4687906418777536, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7416740392242168, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6757646064542735, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004009779645, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512222553499, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7170118567734943, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059420788898, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5964331190348837, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919944342611, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315373802492, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7676898532523203, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.727975431570586, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8300437607761538, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431679960634503, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737853007941, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8529354727820042, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8872046019576301, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8311430493324681, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517236460724, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721959536646, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8962513704329508, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9473810467675213, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8723473771093875, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.798186773964824, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213810592174, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8019358215451386, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7994423231243188, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7577943635897635, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493209873694, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721945839971, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8976953014556713, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9066531267904259, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8031737956003131, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823371551706, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059267891436, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8688267703892796, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8140527944444343, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8418256444458413, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633915979259722, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321878473776, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7994423186772507, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9284088021637538, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637529716634, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513709463814, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972703411865, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8278281509600653, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7386690499637891, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7786492988113372, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425355028475, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9376689645972128, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8864204091129869, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5660185261919557, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8175744647173198, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102538836262, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256101087554, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8887587840114523, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9079671391247499, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8558511435783603, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445439361409, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299490125475, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8187367893801379, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8322366445981857, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7577943621262638, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.677473998350547, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008947968082444, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879311997746378, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9278878004610371, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7853085803599054, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389825741248, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632870855969, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.903974509346443, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9224823447009692, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.870597265019901, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933718651586, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297903783246, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8267117861058833, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8732148271420623, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8832359864373787, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563331835891, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545621583161, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8732148250097516, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9224823428372053, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8210440923998608, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.821044111249372, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.946200356859849, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8824278624952505, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.831143052408236, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7866228413455062, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.746138986450647, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578432664537, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879312109318487, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026806904141, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6909762955485325, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085988999121, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754598325782, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8864204095087599, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681216174178, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8344069019680959, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359894847488, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195390920986, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142496415965, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7461389786388777, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8397339628923711, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185771491609, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929085392308, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7341195272434746, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6959583139432459, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7839884748310829, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125621143819, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419836716331, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9066531226583271, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9621075761794243, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8606036188667415, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215256248557, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.888758786834255, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8140527891321856, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185794618964, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849568005253, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509646979372422, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213779950884, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892337033559108, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6477982106970915, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4054487133703776, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149876896748, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876299856441755, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8019358184452524, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8322366596212624, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8116760089429057, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104518882891, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253822048468, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9637799423981639, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9645892708408249, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9658995734691445, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9635062296635903, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9764905479730304, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7759445726584064, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8740772231024732, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942257394435, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891207032154, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.879146761471938, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9136765233783412, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8688267837635171, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9263037303050092, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9445872047320037, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671381659358, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9334308147030175, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8864204077298149, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9167080770136097, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637496204935, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070043572512, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8791467664790164, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8824278639245657, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7905303116053632, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711777937646, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884639394643, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.846957844666608, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6876299875509438, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.903294201862112, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325150403584, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068803190858, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.85966375716165, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8799743682464743, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4921881292020226, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358275515507, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673104243835, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7154240025483504, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233283958356311, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7264256102467967, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680000125547, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.891054955311975, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9092645183231705, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.876634388388585, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7892336994426559, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950946421148, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898167241998, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9190632865808153, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9130583430565815, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8840392866446003, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9429285975321411, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9385759581322305, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5964331445217694, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.702530044791103, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5486734845391043, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358250187358, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370307969646417, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9184802506263928, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8864204087586631, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631521644995, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511497175004, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105453985484044, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5717666008631519, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7676898373479033, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.726425596957599, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867770720942, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905302956192668, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8568122967374647, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339819453978, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8459424285079734, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.907312222618208, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278671014167, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6352224281605977, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.825589721754823, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6261241870056826, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370308167981852, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723746640283, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8832359868710548, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7799929059931711, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672062600534, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527972436963, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104572121532, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9178933666808146, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9105454018631954, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9314625047744617, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9252299500172212, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631583628714, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8799743628991271, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681154634283, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8322366462381515, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423063201438, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059619830495, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8558511417956551, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8459424345212564, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8895288532691883, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9433475766891435, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9367494767463381, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.814052794116594, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8766343796399728, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799928927585366, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148231052407, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281418511115, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8289388231216407, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619221320645, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6808786111049939, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.846957844322213, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527705844997, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7786493062479707, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6893056165832308, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8479677590310847, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102542730242, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089022505917, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8596637428407062, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8679338440700995, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8840392798275798, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869935004942, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339608811736, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059384121145, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8509646978173812, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8244619315517013, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210587720842, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148268426061, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7772998489469359, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159473346631, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8596637423718425, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.766293641677206, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528056400596, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8652240898937317, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7217432074060877, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8407825968874466, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277755121623, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085850551407, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9118099596671252, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.954984467735337, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.901227404540323, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068735320236, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9485372340786145, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9600626819172647, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9683812332760496, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9376689640144011, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.971129090521133, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9504109761768902, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9539660974594237, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9728307656786482, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9202179863022106, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9635062319675805, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9469902250713883, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8080672047402839, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9111797115066399, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8661325147663844, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407826035766857, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311880948635, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9066531250227574, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9348724508546031, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942313750409, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149142583408, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9462003514595472, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8255897361247568, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8489722011925892, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8311430385215363, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283825460254, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624749326586, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.837619975140335, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9252299511076831, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9299510379123959, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677529719617, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517166042047, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9092645218216807, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8489721933840727, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9105453995135309, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9219218401896326, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505372551358, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.783988483752893, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9079671521893029, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8469578443772307, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754699953749, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9124361590880599, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9525741267863381, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9105453994911558, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.869714572057868, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9257686305872809, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9504109749735963, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6992544057725102, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339613106821, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9053223006093042, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096122470365, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.818736788912078, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7138307438700343, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8749346179284662, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6808786193284272, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700989367795, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953751743712, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7662936426485838, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8766343709560027, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7676898654623693, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.770464785385788, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321867485015, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8438950972611057, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8031737868009283, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7041601288611692, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104564723282, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228282658851, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8895288367412688, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9761291657417666, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.744656356710668, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277775634524, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346274282775, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7648916035248798, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8221891202983079, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8244619301163569, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.907967134888461, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105555426106, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8887587891383049, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9473810498999212, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8577681039255813, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085834864039, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891245685384, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7759445501160336, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760127799981, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8322366559039917, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059367512174, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367831625216, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9711290921182685, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8925625264489792, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.886420408070775, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9626731119405176, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9656413109549022, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.939470608054028, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9511422196899919, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9381240107169884, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9304582534985509, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942282343457, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666559299193, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7217431990066503, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8840392855061706, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754383595322, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059365333579, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6808786227958051, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.721743213830406, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6688802922987521, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321926332217, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445503522386, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8539127448423592, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8887587864537978, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8344068827373807, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797061161828, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9294404019561425, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489721988288511, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8031737868009283, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799928983430378, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085871547665, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382158019378, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.704160129361085, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.692641988103842, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8267117960689206, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581405041147, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898425508782, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8499711821386111, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9066531235744864, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8418256486435018, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9246876950005722, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283992684597, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.741674023384519, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8438951076280948, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7866228354393923, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575424455954, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224307088119, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.890294226060351, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8910549530499227, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8344068838486961, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825842307157, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063802167962, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.721743209691161, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7534666549997576, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8344068738842628, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366245090256, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435036651519, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892337053138909, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9284087970353312, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8925625324150435, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9241418186251242, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867782310964, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8740772349983257, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8210440981388799, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163765799439, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256501834966, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437678788668, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526143942106, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8910549536178449, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.855851149889697, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281530173951, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281543844771, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8080672115990039, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5813030904379719, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718434947430184, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673145455096, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199672624567, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303087912298, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059394480726, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7138307448126726, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441079140041, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743623260138, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8233283856998819, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9124361580506355, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8386797644166964, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267765077381, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358329756117, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7248703034997186, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7662936451300177, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.762070106522735, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142507754078, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240019340365, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8933094058252602, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.838679763369264, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8267117967939851, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.793105937698804, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513671431541, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9453993937498781, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9623913668355712, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9730364988594856, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9504109794531913, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9615338038940311, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7718435006723703, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545726766846, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7943849585616412, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723733848128, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185830701368, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7170118715707979, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7620700966866006, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6584175025174177, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837548714829, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307421809424, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.899827775181179, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8740772360442447, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.92522995590016, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104451865905, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9376689603497188, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.603931845121642, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8615382055224224, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8164063852407643, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494803070278, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125658475668, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9105453997759981, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9161096109532727, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8740772367410027, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9339146288657614, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755748967909, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7341195169374851, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233283971728472, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6926419809972488, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711778582736, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059216310362, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9173026623510221, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8991213824106966, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.840782596882614, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767818481671, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391613240977, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6095241746337527, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5448013961914019, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5869964254970105, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358059624706, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.702530060095335, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8376199744478762, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8104788988119177, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8311430503145788, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9252299565997492, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392803683029, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8872046056684219, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8624675224629867, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8044059215775267, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437582678403, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513739091742, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8940517156251657, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7279754496163341, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8365545573761536, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195262785684, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467740215455, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6057990421341394, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6315943239471766, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7233094685444694, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307962913744, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984784020746, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8643104574270322, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8428631367067225, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8344068807457141, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897347560451, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517214409681, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7592254120073179, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6150878386909897, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8116760277448825, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.826711794227854, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059344189679, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8344068790964861, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6909762813355549, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.737158138706985, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424381753866, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527724898842, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142536742432, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6370308106943483, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7839884759908449, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936462651405, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825909708053, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5350984209219719, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300562995814, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5078118799721739, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982095890565, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717665886978817, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9086178933501288, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8469578365261693, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8267117999228986, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325073351472, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392810884475, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7943849515823115, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9073122224583202, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8164063775115543, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.943763653836977, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9257686330632771, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8757869866385016, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.647798213431972, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7563575542334254, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476595873556, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919973765794, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8344068785425122, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8749346192923484, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.759225404680564, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.785308579568403, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253832862814, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9453993934016898, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8774767948462536, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9437636520537515, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.909906999379068, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122881034979, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7025300457735051, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998603017414, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8697145765068196, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898454479785, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891444506757, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8116760190563591, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7476159362856688, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324927681551, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.874077221178867, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759859687858, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6774740004209072, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7325918451361799, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4804786675338727, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105526702772, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633150914754436, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7295197805930402, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7074046884981824, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8164063639290977, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867819713542, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210620927253, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8962513733430948, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8962513715216043, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.896251375098835, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145823122912, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677493258884, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850067720067, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085783583462, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7295197782973482, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432155014771, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089092464651, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7994423172154985, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7620701035731133, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8529354795360569, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.763483767376912, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943577379048, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7745833867281992, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7981867670797695, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5755880222240551, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582610548425, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307632198136, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7718434879291173, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7786493053636835, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5755880418730382, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850567155852, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936328266536, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675308062614, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7813306305295821, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7549149970868005, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435041412103, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432130479601, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797679078625, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085822480481, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8175744744431349, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.869714572592212, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195414218891, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7994423128702925, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7534666529227986, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7549149962622007, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175100554778, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089320391373, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8080672072656558, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8568123000065655, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7122321770773463, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867875776623, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278656039414, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036164868697, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8499711762332732, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8624675250515873, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9304582569867449, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240876194562, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6740504621705526, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6206215987335519, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7826624728579031, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185770882483, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089078721324, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6774740058317745, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.785308592049446, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.558326980163419, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942891663264, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575438787433, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.858718578600763, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.855851143167842, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8947894707831447, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8955226823884818, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206729335765, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879311842594661, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7401743531744308, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8255897264285506, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046869319214, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582681628479, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8757869971492652, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9278877999149236, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8799743861170874, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425393028299, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9385759586902063, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8840392831409714, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8509646972813983, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9073122154528342, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288521992438, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218375226875, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.942928601444855, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9485372370160162, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9319595763336538, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9549844674527342, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9155072416617339, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8633916063880784, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9066531202400603, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9241418235786311, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9416541578914756, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9429286033596075, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8056321771144713, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8386797515953239, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.891811047773343, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321866427683, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876927892692, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8255897224885846, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8933094042919507, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9257686284337241, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942270876023, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675260116274, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8895288546994715, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7057850367146866, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998509952962, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767925116759, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918477634041, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9053222947774945, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7090191288555763, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7826624828697093, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646087466153, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331333720816, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9329437131868533, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9353465072335433, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9603611574554769, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9575961699144753, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9591542837284189, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9757623655248244, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9207896843135975, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9529258219798191, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9437636526693545, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9416541624993305, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9230391612032895, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9111797029412594, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9304582578071038, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619270416859, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178976774352, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152324887671885, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8991213824106966, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8652240743919246, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517173702749, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099569100412, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9118099523386372, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9546474214103281, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9425067241121747, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9469902299813511, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437141218113, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7759445391424854, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7704647896855423, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7057850283835101, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.824461930996415, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432097745551, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7549150035467593, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7534666604710809, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6388352873656948, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306356241221, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527948431946, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8947894672730962, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8998277789599841, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9039745086152243, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517194843025, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377692615133, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.856812291687715, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8418256483547639, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.873214828510596, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745072966774, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942155869383, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8354835455572296, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8140528014014796, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8354835439980575, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072435556462, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526190295794, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5136684598830177, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7201715054393961, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7461389835457302, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476619347579, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316889745375, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6113819755385861, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6757645976184403, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6584174925989598, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307885405958, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717665984354385, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7341195286950494, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8670357562766663, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6992544141968118, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744794611156, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624814685788, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797550538924, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6876299866117777, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8558511477082982, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544089693962, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026640849085, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7918210748680872, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9012274051310869, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8969755781959902, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303135547044, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947354679627, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8624675239228415, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6825737282161216, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879311842859856, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.651354855057409, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174993645208, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8019358283583414, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8799743609394124, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9511422221350009, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037298600956, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438950908499652, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.866132506566047, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8006919898700091, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7745833819173068, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825937747043, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105518100258, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6057990530839353, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.759225387916883, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5292633854254747, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601214498227, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754271333614, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.901920675136383, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9053222934079328, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.953275041550134, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9399133516048277, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9637799415990996, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8278281458499254, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.724870284890608, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.87234738202325, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.867035751503484, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.828938817185278, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8031737953864451, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8925625308663572, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8984105548044353, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.689305633928128, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526227398382, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9019206756079022, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9046505357684782, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7892337087151893, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149026414479, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505400601974, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6757645926069444, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8732148300548475, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.705785007740983, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702658049111, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267118002329947, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7577943658246963, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.762070101691435, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6842640238668231, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185583971844, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.727975442888068, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7905303124818058, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7592254019046438, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8104789078461995, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.825589727777499, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.732591840151531, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.74761594253636, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7786493071826032, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5640984860635591, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343856957554, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575671788606, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9969839336350439, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9937100978263465, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9967775157090852, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9943580917584746, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9933071494546929, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9793540690565461, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9843363504608215, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9768465914829229, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9686195684967761, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.986878728731754, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8558511552890465, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9073122230708829, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8587185747336337, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711816876151, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366564279456, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.523420350925796, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424324920102648, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6531268977459118, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331544053790321, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197522050086, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5058590936256129, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.638835279024033, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.27202456175097156, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796474235969, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458941466365955, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7401743805146532, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7577943634296491, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7786493043055492, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702727188979, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321554976514, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8848377716562731, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9539660980923534, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8376199746538293, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637477873924, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517189320927, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7106282848909068, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7371581454395287, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7106282875680808, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.613236535923388, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.660172375313128, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7386690681418153, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8749346153338073, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7170118636183582, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947179736364, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.845942441365152, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666570471861, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8449215246993184, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8116760226760275, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159432391956, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382147014145, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9511422197433048, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9771973621587002, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9525741292504688, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.928408801590475, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9924812817251202, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059560323416, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.778649318397245, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7416740312043631, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919821844974, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.903974506063442, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7008948106781404, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7025300431078002, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6859494502247283, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998612162977, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528146505563, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666281157505, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7341195245313328, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8568123033208807, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528184515823, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936496855524, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8080672114682103, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9407897495644266, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.916109615600967, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583433079863, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582544850324, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8175744728881709, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6601723744961906, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799929053267037, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898384347328, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195114019834, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8587185863046072, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7371581419144377, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7371581359028436, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253590016627, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666087449901, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8856314709911209, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9053222983675167, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8140527887523187, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721920288961, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578371942794, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8568122959507379, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8661325016924973, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519527990480402, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9334308144515457, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142457851107, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7008948014146995, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324959405042, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7170118742676744, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224459501169, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583437739223, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.653126915233435, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.861538200351851, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8365545580304021, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640156682421, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740301844099, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7341195152116547, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.861538200351851, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5467381315479167, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837694459167, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316896278632, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9273632906422072, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185841038714, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8872046046981852, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9257686335972602, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711756094693, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6187804267849158, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8529354879942014, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6531269178097959, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494510635357, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575577601861, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8044059079587846, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9407897495644266, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9462003541061972, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9515039984080876, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037265499995, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9257686331921204, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.905322291881627, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9728307676115384, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414759590878, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037215427311, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9700134906832948, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9912886157963816, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9905874103708654, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9923043527510662, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9893474881578593, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9575961735953141, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.966410492601554, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9304582575225349, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.890294232173464, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835389687911, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8558511450871507, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7279754594500171, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7994423322762354, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085878742938, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.835483535973001, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6601723669150764, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.778649318397245, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8652240838394853, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354698548716, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.903974506063442, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8164064004744312, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.902609594477782, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.867933838071515, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704648105048855, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493197674783, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437650336588, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8068526187419117, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8925625288343733, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797632045508, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833860327516, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892337030189832, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7264256087751674, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490872215140915, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233284039949051, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891283431723, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8774767872512479, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8652240822063841, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8947894664711122, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9381240095805393, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9453993937487478, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797620331223, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7879312020783756, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6757645942320966, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321911932505, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307713336901, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673215909683, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9124361565919398, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8187367978312002, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080723170377, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110385013057, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.697608924262414, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8210441045297908, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8643104504334715, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677505995563, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127541021689, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8910549633518124, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9213576153391257, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9477691470273658, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.944587205896201, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9278877938800225, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.896251369094964, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9136765241075251, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942283110703, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096123813933, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9294404054820733, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9353465104716537, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8019358418224982, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8116760209687542, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.836554567644394, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762845328559, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.738669072893831, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.544801379944157, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5019531082425218, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033509802652, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137077685651, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489721998345076, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.916109616297079, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8164063723101886, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337062902237, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.819893334115687, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210441024928099, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8198933313672568, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8633916055093664, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437627240763, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149903444152, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7401743444824044, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7520125719234383, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8333245927961846, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300576667204, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324712964923, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9294404026091073, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8679338568809286, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.918480247740544, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.939470609386153, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625313709096, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5621764896494892, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7662936552220749, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7356416402833477, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434964788006, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118554536626, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7813306296891498, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7981867739333801, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6531269397168202, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117859816926, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982011049558, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7839884774528765, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7371581637443833, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998591414707, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.870597270532885, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163851057783, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.826711796220598, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6774740032948389, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9184802535020052, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755681834788, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767831915667, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142417707485, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8962513749479393, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9073122281400738, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343691410675, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9485372354468774, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6406358642243593, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.689305593610658, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7122321934496609, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291128688716, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708817202582, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.894789462643689, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9155072429932436, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8587185879546979, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424447414942, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549559314589, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892337152914877, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8652240834489187, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.889528851014392, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672060087498, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998478846638, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7041601273447335, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8044059175567893, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.607663203380789, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760262796596, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094725367794, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.712232189980606, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8233283950344443, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7634837634817657, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619366329388, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786833731134, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6893056232530099, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.849971173754365, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5926665978894731, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743393399979, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748720972639, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163733325972, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7490872123144297, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.798186776413056, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.822189129966828, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760139734142, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7634837636866345, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7799929066992562, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7217432140519706, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737165847171, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358273292594, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9235923206365898, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7879311939879535, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8783142496768616, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672137216065, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358275385511, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9073122267862643, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6187804365067783, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7981867669810164, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204122129795, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382073292119, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8407825949084745, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8221891157214909, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7879311959588317, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.848972204603765, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366593643019, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.680878610146386, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7839884768034011, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5525396989358626, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935242896701, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872049855317, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8140527951765342, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117946477571, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9118099545330902, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105484944458, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9582261219242517, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9425067219054444, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9012274046099118, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8872045972691673, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067193376119, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9367494754213157, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9019206762571305, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8976952955533416, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8080672032421296, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382027059347, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527960447193, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7676898463702766, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744744357858, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6671476616613471, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063806004557, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943764975705, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8606036231718589, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9362850061255074, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9241418204319769, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.940353063397837, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585770768891, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8354835537142893, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8816149051838156, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757869922353191, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358377779188, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053223015846482, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9500414726850717, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9536217933991152, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9629528295540178, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9726235110798455, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9500414765702044, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9867771789092021, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9768465902733117, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9606574977365573, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9777138132323538, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9777138141656675, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7170118679595384, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8799743643276415, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8643104584588712, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145768099994, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094755217405, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7325918458396504, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8006919915994901, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7461389852845227, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.809275976612003, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316991407806, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7233094692953083, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8732148264720352, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8489721945408127, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802481927039, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743662262285, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.83332459909601, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8714748626992621, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8386797773350365, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199669722683, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.874934625461733, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9079671344855361, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6477982300902907, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8848377697103592, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145828240126, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9367494743103236, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6959583250064737, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7718434935702005, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6723316875948911, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303101915996, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563522598965, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437546879026, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.785308579487163, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8757869923446256, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744581856482, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068849365676, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7106282979641158, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6926419726050821, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8221891268150822, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624966483964, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511474456971, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228330170965, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9161096153809181, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.87578698691383, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.827828149650156, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891304109978, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7690802376751065, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9012274051310869, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8783142454562226, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.884039291570881, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743695049457, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7718434997281974, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8164063676499551, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.769080250059881, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127485739694, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125725189151, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9403530600868898, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.943763650391509, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9299510419002928, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414745599618, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9390248172707034, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5506073524874721, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6242935171902753, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5621765017611469, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953655728317, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792185394171, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673197672517, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6992544118669473, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8489722047383694, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424389346988, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245967316857, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9105453995538829, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8577681112269271, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8940517155690627, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127453184137, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9433475735366145, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7476159520322654, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8092759808778183, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.905989821098484, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314747322191, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068806581898, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6566582497175892, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.64779821155913, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7799928939940602, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883327588291, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253697238662, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7943849571129973, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7008947971533747, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431680085236738, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149886728008, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256060325888, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7401743575483447, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8128673008369842, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7074046899746996, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943694870043, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240007319957, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.782662493846982, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7341195245313328, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7839884862007851, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434876845847, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174882152056, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9032942156865018, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.74613898103442, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631417665392, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256465144518, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721954420547, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7520125597301093, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324905439325, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.795658096958971, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689551837253, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897286004608, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489721964215036, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6584175109372923, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7931059380200282, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382061762435, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701257055074, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8479677455060277, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026837890981, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6723316991604803, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416399398522, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.841825653522752, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7401743634537591, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6791786863500847, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8267117878489946, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127650183684, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786492995564664, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7310585709553917, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6876299946362671, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7592254099325274, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802440802441, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585881793237, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867673559292, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6224593248474213, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8267117919040748, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833998576183, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872073657401, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7401743375210946, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5214711496022008, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6150878386281231, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.560252664419423, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228207502902, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6943026841542806, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8548846444842652, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7446563417698457, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159386632394, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.786622835085316, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.83761997331552, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7634837713466947, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718434965651472, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281383862054, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754454845215, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8198933357425381, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7866228255619772, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8397339710230841, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.750552768124525, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311953459173, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8164063719671099, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7956580937102602, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7918210599782192, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673180882304, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897297213238, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8887587932164263, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9600626833755852, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933094114390836, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.943347573434571, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037243073272, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8539127550410794, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7704648029959302, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6654105580624285, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324866571847, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884579510922, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8872046004378075, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9136765188476181, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8587185770121031, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105509335734, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.88720460427959, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8933093966440726, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8006920058574586, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8509647038778703, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085796512292, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884783368357, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7074046903202607, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5602526680816658, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7041601269377877, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122322011048278, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876299933490408, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9019206720245937, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.894051718334492, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7057850148002713, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.763483763704352, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256336474778, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9294404042159596, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8333245963046786, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9230391582805225, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513708171087, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9429286009460558, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9372107889686292, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8469578482692296, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.899121384911425, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721934043026, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970814497629, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9563089419214778, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9294404047884784, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9635062338283836, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.905989812285736, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9339146222831124, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.798186795879922, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8807970834699786, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6095241726328702, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.878314250740096, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.799442320712916, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8479677496518636, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.812867307825807, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8289388196325651, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681078609486, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647048902741, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8386797606890527, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8322366457607308, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8128673038987089, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254027322073, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.622459323057233, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228450777993, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8548846444842652, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163613529895, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159386632394, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.786622835085316, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892336876902369, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.847967754031791, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.837619965133565, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.852935475753593, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240819876637, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8577681064468254, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.848972190451112, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8548846393265782, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755712050345, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528157044126, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6859494567247064, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.877476784414151, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7461389810899657, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637555679932, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325076904773, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8152324862885019, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424325169547827, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8164063757931952, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701081295903, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.857768106491836, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7490872177160951, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7676898609050006, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7563575504505963, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982160848915, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416398184782, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7505527636902076, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680026943847, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8407826050927081, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228222378838, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880055669879, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9615338063712222, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9626731114453864, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9319595807630479, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.933914630902237, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346229743448, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228335221026, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.789233709988809, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6279511932707635, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493130859784, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127481434109, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.823328399649321, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.932943712460311, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148315482358, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745061854664, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846442917858, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7994423295926686, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8140528035586798, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6352224467709175, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789011039002, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943983209129, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6495786207539469, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6057990673947276, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.74316799007805, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942958072387, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734790488003, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9299510386624339, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545613045073, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7918210814519282, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762996489471, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178919586976, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.627951209639296, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8697145748262575, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7690802460182886, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702817653194, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665906117078, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8587185797729424, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9184802490740002, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.913058337675755, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9246876935600259, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869963653179, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7549149974310011, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8407825942876127, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7745833972159135, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916219601223, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314767318959, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5058591045137562, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6893056068163417, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.40356687380750456, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990412916613, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.490235638514652, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.3380771490325089, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7154240005687593, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5467381506647393, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512061582453, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352675915556, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7201715078575891, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6976089027825745, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8697145814657337, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837626581148, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185776664592, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9549844652713189, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.931462509386814, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9591542846545471, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067276353373, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510356505397, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431680047510105, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9032942142115467, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7648916043164, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283932903934, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918270773547, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8354835397440779, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8333246006178286, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8969755686482211, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.717011864879109, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919921353282, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6279512185999798, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.679178689604215, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6584175033959339, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883312814816, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633932197126, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7718435000510597, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7185944020809304, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7401743666121512, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303132768572, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786146513638, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8459424359045858, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7401743677094491, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9235923057814123, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740177801563, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825940268828, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8322366538953936, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8766343852643828, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9219218410297312, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9473810416549486, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673187082074, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8244619356657839, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744723058489, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.832236655561266, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.844921526970444, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.853912743362919, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.710628303545466, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8198933436350635, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490872153394794, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527811785411, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256453056028, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526183949848, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8615382172717747, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6688802664088923, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.854884636571692, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505387144578, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.84182564653356, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8221891265518422, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7401743508619019, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358254025862, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951046259122, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9219218384053707, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9643214462156485, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8624675224092455, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414740022614, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9425067265049948, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8469578365925063, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7534666652812517, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6808786239410289, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278653223067, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185706390633, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6808786013719801, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9394706103958023, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9118099550578174, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772312303922, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9429285986797893, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8925625327312984, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8407826071223702, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8529354691967543, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.894051712943462, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876913451858, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8438951031515294, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7718435046599657, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6261241762340835, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972707768526, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314730792156, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8376199729621796, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8006919890109162, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942258611661, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407826052564045, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339626643282, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7931059552973374, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8548846376137376, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8688267727162479, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675246839884, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059139376232, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9381240108938405, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9693242016690887, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9202179888969637, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9777138145840777, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9284087970398953, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9046505409692636, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7690802518072649, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7008948165099058, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.89105495065065, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118723810924, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7476159613614841, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7620701088824994, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7994423165767527, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950897328639, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804241181701, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9715639683696449, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9780517460916369, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9736446450593474, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9661559651206212, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.974042643303258, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7549149925057514, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998513971111, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.86153820342247, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210681566734, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528146864066, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7839884597838248, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8587185876460275, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8116760127520825, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127487771528, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943777316447, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7956580943366649, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680230407182, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431680191957744, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.901920671539019, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110408134017, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5214711658968753, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6943026767907863, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7866228279729389, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307443748246, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563564394075, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6297746117460663, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7592253981954963, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6548947200640519, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544131635187, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647838737265, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7892337109329848, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8766343819796049, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8740772344753874, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145716317074, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096193248686, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6388353004536319, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7690802687974005, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7264256054351856, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430374318013, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358267542518, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.831143050879638, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7905303096871923, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215286619008, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511381780713, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878376566982, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8221891255020793, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.735641628968258, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998472542434, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624945498677, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.840782603164184, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8697145836744484, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8539127501392182, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8902942217638876, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366550843638, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283872252861, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9629528284696063, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.909264518550486, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9563089395785717, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9645892726000741, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907236413443, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7866228335221026, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.789233709988809, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7401743657145723, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.870597271343415, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526170446307, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6531269101436056, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.862467541169837, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.4532618290645689, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585829620134, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737442812618, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9449947157690874, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9445872044255242, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9399133535319552, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.868826774069284, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9155072396262686, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.4980468694786893, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6531269146405009, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5058591215850693, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.4167966727158677, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224335281504, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.672331696606693, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.779992900124114, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7401743560602791, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786091371666, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.884039281832477, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8278281494797586, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7956580849949136, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8705972664852076, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583437148029, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672114967429, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8864204129771983, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8519528091439206, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.895522680622704, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366550640962, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278700909095, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8740772282099576, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8933094042332754, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7662936527502191, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923178176517, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.720171497308867, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7520126043756815, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7759445578689335, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.750552760805423, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094739085397, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159465315778, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7577943597796414, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.794384950588825, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8116760211734496, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228632853316, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267763166604, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142444327193, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9241418242564589, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9257686286876375, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898683237416, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9124361604612872, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.85293546921224, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9196425381681965, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8438951021495991, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.878314252446281, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.901920677075459, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5832033824199223, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.47268345867468403, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5175708866230246, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059960870132007, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331475256748, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8529354765081247, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7956580980682686, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.44939263433908416, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343815912265, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740210761683, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8661325147084561, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.896975570358662, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8255897253845772, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672032715283, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213797823058, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8365545564593958, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7799929000956931, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5679366014908427, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307311398193, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647890217614, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8568122939955872, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9173026583497027, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7217432315536708, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303056738208, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.913058339111227, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8652240817826112, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8322366559336459, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8606036162906818, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920009187412, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099512547201, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.852935474113933, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.74761595631743, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8152324864220188, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511548604475, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325014557808, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7057850210766572, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6424325169547827, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7248702818295836, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526165955804, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.874934615918126, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8164063728845004, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7008948130927071, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8044059108708275, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253796542698, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324870312572, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7490872133960844, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.800691999018636, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.825589723769509, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666568370748, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897143081871, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7490872193800336, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324839192274, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7264256049369677, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721962557594, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389836679124, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6261241838592256, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6352224471769531, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490872134236602, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883284161411, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762972011505, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526067665781, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7892336986166808, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8558511460945062, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646271941763, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336884261267, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8449215287048247, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7074046872062387, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6442251264354232, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423148633771, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.705785020667032, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6859494475715668, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7356416273349788, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6740504647382672, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432182277791, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476755086145, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6671476697156463, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.649578625504957, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7690802422836155, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767900396203, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366166029848, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7295197717914884, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7461389957477482, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.709019134979535, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118621985055, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506569593446, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7704647831525115, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8365545593467897, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7106282935619168, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357631483032, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526147043915, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9066531195942135, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9130583359306882, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8548846405315391, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096160298348, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9481545310481984, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8577681109914037, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9142907219088446, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8791467723229369, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744794467636, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956581049576715, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7981867659180311, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744678878862, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6893056164023167, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526271140698, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723751628097, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8311430410788101, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6460136891649393, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8587185754638629, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357541823672, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210518648989, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8479677510025545, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7577943627068013, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8643104464885978, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489722041835921, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382107670342, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9005297881852656, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9019206744971883, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8386797554814659, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392857131545, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849722731248, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7648916179962345, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8386797507841185, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7620701043438951, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631423141982, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737094459932, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163764212119, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324955271899, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431679860225193, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256049098804, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.69097628048171, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.86613250483225, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.941654162181995, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8643104573051346, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094011299084, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637567532202, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7662936536966973, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5774953606014381, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6460137019706053, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306267294869, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.803173794368867, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7732163683238132, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7310585503377613, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.682573744206778, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527856131999, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506612086522, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7592253907765464, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8529354739036634, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7732163758928203, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992543990280816, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068917412276, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7690802447831941, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619214627015, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8344068882984963, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802653628794, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744667566637, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5583269830708565, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.767689845224152, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7577943571151641, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338487182491, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094660508254, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9433475754651414, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9066531215647398, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9591542816232255, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970767643117, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9549844699221328, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.702530059888464, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8333246012864387, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6757645973841644, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281571244347, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898632006413, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8749346190049268, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8175744723058489, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.883235989771206, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942114381838, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354789789295, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8187368006921222, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085810234947, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.738669069395507, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.80563217767733, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059089351152, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6531268989141328, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7994423265799204, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7931059545394792, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526194992857, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318430026037, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8289388273239541, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9235923162471613, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6001883547170722, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504635551551, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583240826449, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8459424473168895, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6959583352676523, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718435246880399, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377804404098, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059106867572, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9219218390634115, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9367494791997125, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9385759643403989, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284087998184705, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222975978206, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8824278619477107, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6992544482435937, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587865640317, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094051009939, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760172439798, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8955226849696247, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998538760497, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8548846389107361, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9600626825110314, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105454020792422, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7943849715373474, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8596637495146893, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8887587894956562, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068874736231, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122188811599, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6370307795335537, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7994423265799204, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7264255985849235, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307564595724, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195324819956, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8164063672561783, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9529258208886447, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9246876945626447, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9252299520204625, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8933094091137675, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.773216369088377, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8438951073489552, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718434790231755, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321720130873, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026725379405, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7534666569353137, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059536035127, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8278281596663587, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797693002118, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898277498544, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8933094103334811, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8816149012509708, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8198933388858011, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633915990436198, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624822160089, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082769948348, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8244619340619606, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.712232174969766, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493089161044, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056011345463, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526332401514, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7505527668338189, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7772998676295401, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241628067771, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366509080903, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7549150028166418, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6723317075188336, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8397339691944019, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673210362812, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354738006014, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9118099554840938, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9059898110382633, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8661325106906592, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677608766183, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632870229973, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8661325085234012, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8354835473331741, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8732148315210858, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148302534742, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367964322515, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6169358198106476, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7563575465203627, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6992544121474663, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.843895106449942, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666183675879, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.47268347563965185, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5448014058934652, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5331543990556957, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195236940438, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792030618999, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7745833812320552, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.806852613428247, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9433475740775773, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358196322607, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303262354647, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8910549588271268, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7648916206522985, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8092759807676908, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837557560904, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321896554983, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6791786963520141, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8128673149839195, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5583269725354536, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640292708682, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.762070098170814, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8128673173255951, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.812867316427039, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8056321752349106, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942145973444, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.887984041454679, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8714748668472959, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8568122876809264, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8962513721115286, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185790271642, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511544893309, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.821044100295118, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8164063809915171, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7295197843635424, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163674571404, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619307124529, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8902942287623993, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8714748567547732, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215322004592, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361555672239, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467656236743, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.700894818270572, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6791787013329116, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7057850485961102, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389718949729, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833795485598, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.752012559033018, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8976952949392017, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.78133062163618, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424399044025, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149781747829, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7563575806359242, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8998277723188748, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7620701045245973, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582600985456, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951030166745, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8969755730617104, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8652240820491653, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8962513768479794, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.855851145098671, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314753939224, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.781330620052764, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8397339752657407, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9190632890264381, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743717441734, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583435440309, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9525741297869759, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8984105525737066, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8688267799240028, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354803188699, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528071071192, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6619228871728288, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8210441057882036, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7490871980531162, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545572017825, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.884039287855569, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210440966644517, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085808002893, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8006919841229637, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359980624592, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185874333557, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7041601203399407, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8322366517879288, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6943026692945827, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704599591256, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493149571352, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.717011867393342, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7057850259443494, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7534666480127614, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943763310415, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527959753342, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7813306245063181, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8116760061215136, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.581303070175198, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056019281615, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506591822844, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.767689851102805, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.78266248565934, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7648916117756649, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631904019361, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137089800542, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7185944232343031, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7826624826628603, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7634837635381032, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.861538205866359, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.694302678610535, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.853912756149364, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8940517194823404, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8489721899380217, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789082566513, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.789233684706331, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9594592624236962, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9572778031076519, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9706877690553416, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9764905474320611, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.965381160297276, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.692641985800128, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431679902681861, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6976089211931659, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389828328346, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228581181021, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8902942329092689, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9202179883406968, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8615382007006046, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467758606716, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916009942479, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6723317070553846, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7745833877810181, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8548846489991365, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708846480798, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.805632178403448, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6315943031953134, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7634837748150922, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6636689487504782, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199250506944, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759739447816, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9178933682025369, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9334308122901501, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8529354768770877, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037233312824, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9026095998002927, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7431680168883674, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8568123130655887, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7634837596475902, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197802377251, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744847643058, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7745833783148665, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7248702716243243, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7461390028413459, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872349431313, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673045716924, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8783142488314191, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7943849504105531, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8019358296585296, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767926700302, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059262960253, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6992544030390644, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9230391602902238, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8344068827416528, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998561211693, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240829825814, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5945512498018425, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.924141818337642, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6723317078180489, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765213666351, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527668138557, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9073122266558433, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8643104606840811, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9032942096494964, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647017008692, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213791888402, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8652240916809852, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7772998607672376, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7994423233953247, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681181608844, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424460774162, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6169358391562886, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6548947424725813, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.709019155997519, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264255982292436, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916105511471, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8397339627751073, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8766343835365846, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8568122907186615, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336996589508, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897253810802, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6706082863749722, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7534666359239235, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7606506500824458, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575841171324, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389780693524, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8807970831593154, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7931059392420484, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7201714981369222, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430500164361, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082849778398, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6671476735917088, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8449215207981943, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8519528041079348, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835295972587, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840409769717, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8187367888568253, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8438951163702305, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9005297874670337, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.838679766344591, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425311583434, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9099070052281779, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8376199763327274, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9012274069155026, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336960913058, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434953428572, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7943849505931294, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6706082836641328, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7813306223083466, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357532863876, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117858020846, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8807970887062315, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.865224085557132, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7931059435221117, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666566422556, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435047501582, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8774767956923115, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8596637511133528, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8438950967204039, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283806257119, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.843895111395529, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8006919825285489, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6926419818228998, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6460136995996173, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149912247597, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.624293518209418, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9815951093056485, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9868787297731318, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9861513902115968, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9651191106945306, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9778834108282332, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.908617888124199, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8548846413760404, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9339146244807183, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9511422217798396, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218374358192, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8221891221315257, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8469578443969369, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8449215294182746, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797651115195, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625309040057, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9219218365186462, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8568122873888699, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7918210655055286, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711819063429, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096119398383, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7090191285506371, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6976089158238966, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.764891618465086, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432050300338, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011764687354, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6791786881483621, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8152324841041448, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6279512034108515, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430506361667, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.615087837664108, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9449947131707093, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9515039984031942, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9500414745231932, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9768465900507703, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9543079666512592, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9390248186879548, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9719924804353431, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9473810469200697, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9362850085377219, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620707367338, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6791787040443369, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.5253688037887858, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.5813030770288424, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.640635844456326, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073617613401, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8757869904881402, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8311430407684574, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.763483756242003, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9309620752496831, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.87147487547323, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8984105527927402, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9381240143152726, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9504109753196229, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9433475729522237, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9569571507763529, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5175708933866409, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8438951085696329, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.661922865343857, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754475388152, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321904765628, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6619228945652819, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7956581061653296, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7718435181117261, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517162384684, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884454982946, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8267117996193065, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8080672156472124, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7233094861413433, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251051965787, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191431114236, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879311884793844, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8428631458849583, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8568122899522763, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905302965120654, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339631841316, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8300437675051275, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117929478963, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8267118000100065, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.622459315290359, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324823371131, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9026096009977012, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9385759620852164, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8783142503299857, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352806081571, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467662469367, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8615382221979436, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8128673110701624, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9437636538320007, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070132247935, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445745440022, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7170118711375365, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8887587840424637, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7476159525793755, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672019648735, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506598623598, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8879840482897275, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8947894681183822, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9019206758522503, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256416427536, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.782662485072886, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8175744811281891, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8910549588711992, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8933094024046162, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672141461378, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840432950282, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7154239942199005, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7620701035731133, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.891811047237993, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311939629052, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919808752145, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6757646070388941, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7718435004635131, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7325918407129115, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833849718436, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493090398875, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8068526321079639, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8267117929478963, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7431679913363787, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026779510203, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.794384953878808, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8397339701239978, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7853085708620031, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7154239854030734, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321769650513, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105561754191, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7759445367780883, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8887587809439268, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8428631459624317, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325080667253, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527790268383, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9367494741517756, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9136765211652138, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9477691433745685, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9348724559758208, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037272699787, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.6992544159409663, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7577943605381299, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.667147664395263, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943822006546, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460136982471015, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.5926665937195662, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.586996421298455, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6926419768209052, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206215978841755, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548448839107, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8210441108072005, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7008947993663988, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8479677468416553, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238861713814, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833873146507, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8489722007814962, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.6976089161602197, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8116760094078594, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583245189227, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191417909208, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7154239973463554, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8140527909751734, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.8577681037602715, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026095937589013, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527960241111, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.794384954958668, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8529354782139029, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7759445249887136, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437567738074, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.833324600755123, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.8887587890960159, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.8092759741203631, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.7620701107612405, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306350891827, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8887587799168191, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.7879311847317142, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.7431680066138986, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.6740504712017769, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228328292476, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528034584297, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_readability_ft_llama", "target_model": "llama", "recognition_score": 0.9683812326251908, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_readability_ft_llama", "target_model": "human", "recognition_score": 0.9648551539988958, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_readability_ft_llama", "target_model": "claude", "recognition_score": 0.9807288622592382, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_readability_ft_llama", "target_model": "gpt4", "recognition_score": 0.9844563522652491, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_readability_ft_llama", "target_model": "gpt35", "recognition_score": 0.9906599757652189, "ground_truth": 0}]