[{"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8856314815737962, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8198933292889462, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8244619254317274, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.80317379810002, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226729523708, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8365545694797739, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8333245903501442, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9136765213013656, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797072322867, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942292971501, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8606036166759766, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.883235993097269, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8418256478442669, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063714541142, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.806852619763049, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8757869895717668, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9241418180856666, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187367921785298, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127566310596, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620696690846, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9358173554620894, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9518632274753666, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9532750412920776, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9732407165760631, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9543079673993512, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.879146762842401, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9046505334252417, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.905322296435672, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672088010283, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869858467859, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6352224292154242, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6859494363515315, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8164063663447882, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191412430045, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321834684293, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8783142547681065, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.810478915029165, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140528085630732, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437591795394, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526398922512, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9155072461954609, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8824278626451363, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8732148300101088, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361574285016, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206717035481, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.741674009030158, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8489721993044317, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.834406892828796, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646157837687, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388095435263, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8679338566730825, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8714748713389745, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531238295128, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274023568159, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632873363302, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8198933319175952, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8783142487652612, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.93534650831818, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213802792482, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743467165242, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9124361582557331, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8791467765870892, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8606036278796624, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869832242436, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942016727149, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8864204147192714, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8459424429238757, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8519528016095347, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9136765175656156, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526089321313, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8104789233414501, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8469578552444498, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8740772397251398, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675389436872, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680025091844, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9005297902452917, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9289263307618331, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8661325087468869, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9257686360576128, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.947769145604637, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7879311986962821, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7799929104561552, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.843895097885138, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.828938811142159, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575696627137, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7041601438431148, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437670264038, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835592237094, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.819893335562008, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445504186896, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8499711816692882, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8757869870757349, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9273632939158121, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127523057903, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117972615522, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6424324790034869, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8044059033233434, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031737913780757, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666648812609, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269328509727, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9196425299082291, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9026096026036604, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8633916012636873, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9142907231850845, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9257686327120654, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.767689850518166, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8499711692153101, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898553726881, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701140217143, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970871713948, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9026096033628546, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511485596386, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8365545675337216, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837692686606, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.860603618840585, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8984105484043816, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8670357705133553, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8449215296532119, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215348959729, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441099885968, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9504109772358927, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.933914626365346, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9740426424096336, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9826909040735436, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053223036507771, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732163696963857, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7956580895319284, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7248702666243071, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9329437135194963, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9343951641046917, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8489721957454841, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125684322571, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7138307483019115, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314670739522, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228328022311, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5273165287402091, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6876299976095013, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6297746167919418, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544230540789, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105623188701, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9105453971780859, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9012274121308971, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8714748599799829, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072413649095, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907217067433, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187367935147072, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8740772501379449, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6926419601504318, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677664997844, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718434982299206, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9412234392672596, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9724147152134586, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9425067241057097, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9399133534672176, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9693242006348686, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7325918347329796, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.586996425987231, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.723309467768663, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575610489135, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743582683521, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9875683487785368, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9920620060800414, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9678992942066221, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9902915226657384, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9874720666773017, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9693242014254251, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8840392910643187, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9522199312270745, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105549887492, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9697854126065786, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8386797591236419, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7786493032937657, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8587185835117402, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269137479744, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063677137255, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.831143046284132, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8116760106524867, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159414828406, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.738669063549018, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743644779116, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8962513708995351, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976952945685055, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8615382016510231, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9299510376389908, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204129648174, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7866228332613668, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8386797584303809, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7839884652689596, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085884355085, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759754153543, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.744656349345866, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7732163637935192, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6909762667986586, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059160245881, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195138834339, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8233283903949549, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8365545763291367, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8267118013342883, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916060524478, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526198466025, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7931059514124654, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7853085780832313, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7905302998391316, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036208665462, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163701284589, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8558511638082527, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9372107904106973, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8848377699559972, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545684421289, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772391954854, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.849971180907589, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8469578360887758, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7826624826136845, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316904427499, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797675678873, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8998277741511117, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8519528074758804, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8856314787596958, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026095983626097, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.926835282873945, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.911809951026066, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9246876909740559, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8962513786407826, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933741393314, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053222934247246, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6959583089252508, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7264256124888107, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6460136757857639, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527732488745, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239917674446, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7549149939362646, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8092759690150657, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7310585435059987, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210690732385, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215240090401, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9263037276115857, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9268352816759404, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9437636504481659, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414795769245, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.919642532586829, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9594592618309193, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9394706070595843, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9623913654010363, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9813106908669733, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9492946344640767, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8428631384133429, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8688267766776216, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8879840502303382, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.833324599854329, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110359341896, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.846957849479648, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437693360495, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7994423155054304, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324894381475, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204077381844, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9372107903848682, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9118099578576732, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9294404032638134, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096109242506, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9556514177266158, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7994423230147185, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7704647802143202, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.791821076139655, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950878107755, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354702053409, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.704160137944937, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7401743830930165, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253670109311, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377618099982, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867861593971, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7981867765410375, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7106283281374379, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187367929912837, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063905535303, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.790530313190961, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086178943461841, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8164063769512154, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9167080753655322, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392833091694, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9284088021859424, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9005297938969508, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437693360495, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7799929057532405, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714987664405, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671439817459, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9543079664197572, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9032942076801574, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9656413099202666, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277737477858, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9770226287798802, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8925625266022097, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9294404017046408, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9412234442463274, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898079400738, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9385759643489738, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8856314828545897, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7931059640370369, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7431680236483789, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916089138087, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898404749177, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9473810450507157, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9504109749981701, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8128673136634835, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9441768567127086, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9348724481217425, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9202179841467526, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8918110440814646, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9358173558442813, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086178947014498, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070101076795, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9842154392824712, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9843363519266163, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9445872115660748, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9884026384548472, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.968381232531068, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8969755600731445, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9105453935548254, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8840392733192827, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970863150519, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.877476795239752, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7122321625375115, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6774739890392892, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7461389831979998, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581627114537, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026535040058, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7248702875133959, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8633916122002938, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7170118947073898, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.76348376531689, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358301660166, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9309620735509047, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511415550293, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.905989810060626, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835473602008, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303039572656, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8910549548880788, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7918210745484935, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8068526311912169, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430503083864, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.762070111665615, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8887587870171674, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9294404036598584, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9437636539845325, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179854364978, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.918480247616522, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8791467746444929, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8955226816376199, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835505416865, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789049970882, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437656775911, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8749346129510539, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7799929065356196, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8723473877165238, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056009830741, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894605288589, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8714748657895119, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8670357609810395, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898434133219, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760115586917, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117953376054, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9284088025022286, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9563089432103739, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9612438079343211, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759576162952, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.965641311877603, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9099069989992938, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8539127590118076, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8397339720246696, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325009360364, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437151886106, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6842640376605925, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998545705854, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031738029660651, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791927233038, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671477039730104, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.886420415148632, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9394706079137902, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9059898157793173, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142507905842, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226768424682, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.806852622917936, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8289388075548787, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8902942397352963, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441159838064, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195383639423, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615382069598484, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9079671309029964, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8615382163973759, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163623789828, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816148989725001, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9026095970789493, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8840392889670003, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531289080966, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099574774301, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528079496916, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732163606848348, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8322366531588303, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7138307599530008, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094686849544, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359885680373, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8910549598260936, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9324533104459809, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9329437172791344, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923188721794, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9289263305997684, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.884039282374357, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9358173599919726, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835383540461, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425385493998, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9289263355407673, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.854884638081092, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7718435033016023, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8714748639051773, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.88875877856508, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972713946445, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8832359870604689, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9353465080403043, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8910549560054937, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.879146768611822, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.923039159972071, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7592254054049521, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7401743837073346, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7549149995513242, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299754013954, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666686180048, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.866132511918938, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9039745006441872, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8568122962859714, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.849971185432523, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297857532315, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9294404015897878, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976952954062557, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.894789461921682, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972692330307, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215284114386, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8766343815784765, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8723473799564404, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9053222981899388, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159552781138, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972720595694, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.4610167997703648, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7371581532511834, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.74017435729, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105456777939, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118976505973, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8807970780145138, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8489722078417793, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8489721837361772, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898512399117, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467590569906, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7371581572750495, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6976089189513136, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.854884642235759, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493042826602, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563613068714, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8289388038406134, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998694652482, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7592254306584946, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367947374953, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441193710128, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8092759784813998, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9167080728963604, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531249021564, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026804441728, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872046022951515, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9230391610144035, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.861538206848695, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8652240840913044, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.890294223242464, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765255622716, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8918110476625729, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.903974514877668, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338558039287, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473751806397, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797697577977, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7461389882426727, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8643104619849716, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7772998543904598, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933388351799, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303072121135, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8947894666824296, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9136765219812063, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9224823384151707, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206785873153, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.876634387532889, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7106282989355076, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7786493021931689, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8175744664339365, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849597785587, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506674251019, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9532750421587864, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.964855153467606, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8887587820699062, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9319595785941085, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9268352803517378, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8864204142209418, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8624675340892144, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8529354779581254, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281482538279, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127438503207, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7799928997729397, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.854884640516332, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7634837725757235, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714976229424, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759749372198, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.804405902169202, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7853085854771006, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.815232490492366, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933414148739, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690783375606, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.80563218244678, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.873214827129453, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7853085954773137, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509646982676621, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884628053306, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9105453989543093, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8955226810353168, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8587185939297306, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072441975819, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218436138097, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.955651419703228, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.90465053775846, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9284087991808541, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9403530567133155, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099591848856, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7826624774034852, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.888758800420644, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7772998583430069, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199685796093, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210654310491, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9543079660624495, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9381240058237786, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9529258230442115, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9462003542738457, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933729999741, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.560252684719771, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423169780621, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5544704636143961, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085877790882, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527638190955, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7662936346874828, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7813306312668112, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6424324935977513, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.69264198507895, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.763483771916178, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8499711799965487, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7505527794468985, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7772998616102619, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359929314518, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337029353712, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9795114468327305, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9755769078491723, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9771973617747195, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9683812334192566, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9869795099140833, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8116760117918908, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.921357620004271, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8104789005434613, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.927887803446071, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437112811807, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9026096040975158, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.887984042215267, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9130583415100423, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511430904984, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382093826162, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7956581118025882, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490872248065351, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7931059645075889, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416460598247, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690642444662, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.734119518889015, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511308328128, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8661325109459492, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.67747400839134, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.806852627073949, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9433475807792279, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9556514249484382, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9079671451023278, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745116782223, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9334308135486399, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.924141823838978, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.89405171423259, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8558511504746353, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.856812310415746, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179905582969, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7401743455275264, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8175744760567623, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8311430483908656, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527919872033, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8933094064408037, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7505527678563132, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8438950935736916, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8783142450049316, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096124322554, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846447938837, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8479677587634142, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8887587918680174, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8998277801452832, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072423731513, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036163804598, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9294404051958957, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976952945685055, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8210440924684991, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9299510376389908, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767851432153, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8991213878766328, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9289263250031959, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8233283903190867, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080797067567, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467612315387, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8705972752366457, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9213576188427458, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8624675354297735, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333246057602652, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213769296992, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8289388109469814, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8152324942218327, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.774583385415644, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.732591824484622, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339600373281, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6757646130564973, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8539127524688078, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388149784354, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300405140212, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544214010918, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9202179792723724, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9294403992731213, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9173026615505875, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382113660944, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9416541632915226, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9278878015822464, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8688267762972283, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.885631482714194, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744702143574, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418195201349, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8489721918327992, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.859663748221379, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9690910449624022, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080736848275, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425298271647, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9575961718856548, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8887587833632948, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9348724480235874, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9294403994881911, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9155072413310228, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086178946260159, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8757869953191487, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9019206673561516, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288600902169, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314689776302, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8807970818019547, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9149009564037935, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9167080734161994, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916093644154, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767860208131, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673144496141, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8244619323698292, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9485372358653438, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755702182575, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.883235987523917, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.982557515276269, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9810219628789815, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9820137889366104, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9768465894488353, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9843363506583693, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9732407175867237, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9810219636097532, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9742394417110827, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9884918504654763, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9722043747591386, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8902942234113392, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9207896823941304, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9353465140903006, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142543611332, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898184310627, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9353465128650164, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9149009623900671, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8757869951143749, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105568732156, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933674632854, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8418256418449293, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8816149057526615, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8757869960267426, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528071534689, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367969988943, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8984105511056996, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9394706079137902, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8872046036644903, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142507905842, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226768424682, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7505527640723931, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423274329978, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059038580833, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897252947513, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849668795829, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7813306302545031, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8068526200240914, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9184802509776473, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920026320392, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744820688868, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9099070072208544, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976952956524114, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8791467720152201, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681067475403, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391661652388, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6548947271149382, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7648916143169139, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.689305613419721, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059193438702, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673146913762, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8624675427839019, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8365545559900113, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9184802456042245, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625256081343, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303195233826, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732163579933277, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8670357596329689, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531190021048, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578451918046, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274187403944, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8807970735392333, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.867035758774577, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8499711747723305, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.928408799919432, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288527510314, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9549844659584139, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9046505396070322, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9173026566292355, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9449947169279549, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9367494724175324, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6706083050805776, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125754115927, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228245371527, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104333857528, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943962215869, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7310585964029721, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624715431477, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5945512710446169, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.735641642229717, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303151810139, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8984105532118009, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9155072430659394, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8998277829085733, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916062196695, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036255003096, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9437636571712649, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9412234411595364, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9329437136186672, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359896303414, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9572778040595259, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7325918181672398, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7813306326891193, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7839884759808611, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.771843515319888, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.791821079163085, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7279754321788712, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7620701053237366, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8080672097677343, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118611966798, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.729519784476126, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7918210639558698, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7106283281374379, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9086178944100232, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063905535303, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339685251474, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9039745101243297, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9284087981195864, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8864204189293532, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9241418208054782, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.914900957134461, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8311430360452151, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9358173547048231, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9412234406596451, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367906531625, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122256020804, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8289387866691543, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8824278640357467, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8766343815236476, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675249375985, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637562822789, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8652240812793698, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8740772258264619, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9207896800180304, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772275119943, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104555057189, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7106283025317065, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6187804111593959, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5888891267155768, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4707366046282883, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.642432519231291, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9130583381248675, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8816149003640805, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059207330692, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343858459842, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148236854373, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9289263297772694, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9697854122561937, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9481545309801297, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099572163764, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9651191156310305, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.707404715456606, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7931059640370369, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187367915407058, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367884152356, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240082285624, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8652240772370478, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9268352815608428, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8624675195807305, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9142907250232123, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122235822927, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835402973838, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7505527647458419, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8333245908418253, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943841158831, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122902190244, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8509647066439278, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.80927596861937, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7931059517352316, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392903264443, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277778664706, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7549149893094412, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6315943023685634, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6566582650789838, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.770464783195419, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033907384097, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8019358285930152, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8198933450232112, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8104788997378806, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.841825637719606, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110443539987, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8783142479689666, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8670357512093381, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8872045958902326, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9207896835048448, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117909025387, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9453993926638294, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9324533041980798, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9348724497585067, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425332500701, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9469902275872377, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9053223054530413, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9039745106456561, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.925768637858537, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517104020114, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576194672687, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7839884747473462, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8568122949702076, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7879311855800546, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283873054409, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245957591532, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8816149049289134, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9032941983910278, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9073122295591516, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9219218284758866, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632967580472, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9818752784684468, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9796676462675442, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9778834091506244, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9704646627463805, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9778834113475465, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8633915909937478, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8895288554573166, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.803173790532036, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148199775697, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681180577226, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.861538214877726, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8679338563621809, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8848377669874552, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.867035764212143, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226890136261, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333246008785986, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7969253886169653, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8976952917396982, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872046012131412, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9173026548941192, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8596637514589548, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8697145891583835, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8774767918419156, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867807825499, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325152039968, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8643104520420147, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8267118010489156, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9142907184430414, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.849971173536447, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637527942381, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8991213796661918, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8991213883876049, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9059898162990285, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026095997477901, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142522077597, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6959583386836575, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8278281454215678, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8799743695815581, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897332770807, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8723473878534618, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8714748645811978, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8568122894632315, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8816148986528389, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059361249088, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951031766196, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8925625263549355, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8723473852629364, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8688267771879099, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036098926827, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526279408793, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8449215216676161, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8376199714011628, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.876634383172631, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210440949000597, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240786974187, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.732591836278302, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7704647985874774, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7154239938493425, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303173341948, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388112230294, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6774740302204167, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6636689402968663, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7074046910098987, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.793105940560479, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.774583391702042, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9105453945048237, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9284087966442979, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.840782601304962, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9184802469324549, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9026096016280053, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8175744731151361, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125938691473, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7534666410149835, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.803173799705929, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.626124193043258, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8969755691141238, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511515878311, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8895288566146694, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283905274591, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204211617396, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8984105487575316, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9039745113549879, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8633915949418169, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9594592627986271, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9268352813309254, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8606036153916692, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8887587971731284, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.863391598016219, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357525505096, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256526001509, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9582261200331478, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9079671440138537, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8840392865859076, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070015228481, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080696340993, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8376199745506948, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8697145788120051, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8479677540614127, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721979064238, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145831895241, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6187804344667678, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7217432010761454, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.847967753741319, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149879832596, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637511039407, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7634837629957024, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.799442318976265, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7931059352511465, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125796299161, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677568434678, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8872045996594403, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8799743651883205, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8933094094059103, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671394200974, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510387463069, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9167080785853864, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9263037302446028, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8840392786463833, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179809669583, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576159805804, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8376199682109364, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7138307630309668, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8376199774831433, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089205133847, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619307619027, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8479677525302066, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8887587902888336, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8895288489725823, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204088855931, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743590291623, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8606036262143576, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976952952495437, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9142907157409832, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.877476795091614, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711834764866, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.861538203506519, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8175744756225227, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7931059455625052, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325056826129, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891230216908, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9124361604477871, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8895288539177206, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8577681124401277, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9536217936038582, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952934239393, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6706082821842042, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6442250936583418, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6740504830252626, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761354531368, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717665869369742, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8766343782549698, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9372107929998372, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631472047411, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9012274145832975, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942253271786, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.854884635027272, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.741674011221046, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8766343694879124, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.860603622823464, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.876634371665074, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8376199672500251, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8255897279167582, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8438950881142246, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.769080244083905, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117881041233, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802569501347, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8418256329740681, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7577943733553878, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046983243735, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527614118848, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8807970850468545, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8428631439612245, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8489721917154247, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9362850044763934, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632963615502, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7745833908880331, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7057850168378705, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8104789038407525, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441276865217, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389762290441, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7620701044595608, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8116760124024778, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7416740066675175, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.87997436507834, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367857495346, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9658995717152966, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9539660999165482, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8887587756691736, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9252299558796697, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9629528298810041, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8962513655122062, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9449947171736695, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9118099612218389, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952946621376, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743680419521, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.880797076671719, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8824278641219244, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8757869995404062, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920007440974, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256478257159, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.805632177124597, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9263037272851529, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8848377619373965, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215295650351, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528107211355, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7826624754423348, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7931059746748289, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7799928738259115, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152325080107903, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894614946993, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9394706115885256, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9543079680506212, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9314625059116313, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9412234408009986, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9609517070504429, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8910549513262326, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9319595769492409, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8856314772426723, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9358173547953392, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110449156396, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8791467681899635, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9268352782596716, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531204091384, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148341482467, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391641949574, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8006920003057749, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998622979064, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187367950788373, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506671746995, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068838849601, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8210441182814707, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8615382258481225, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8652240912846664, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361504558696, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772329861304, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615382044026132, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.647798227971952, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7577943858750117, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306358338249, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919919254896, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8856314734876108, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354695232, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9569571481040623, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127581113513, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923186803408, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8418256517982383, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840475132069, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8128673056564325, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110416190512, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760232094966, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8962513743263112, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8606036184464478, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8633916239469762, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.821044122490885, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619241844616, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8596637511171014, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9202179872635358, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8529354730501859, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526194908319, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956580961059743, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.858718575117111, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.851952810906323, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187367952606139, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743810153131, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142452159436, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673117269481, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7732163722452676, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.699254417043637, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894723985176, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517217252439, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8887587799251868, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8175744723403287, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.747615945256182, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740423151152, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.859663753778491, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6315942856818233, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7732163773343588, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6757645939208947, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702793838796, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933269470137, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9079671346365481, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9161096129565086, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8459424393765829, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625226902967, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367933272904, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8723473700659797, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8376199658666111, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8221891270322709, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835437583585, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919961377377, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.825589727947827, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511513698672, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7905302924393895, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.855851149728573, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748662685673, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9284088011647512, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9079671429800947, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8872046013315813, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070083752306, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9485372337856847, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8418256672843588, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.760650648577497, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8164063799386349, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9105454121325495, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185899964845, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8244619411636781, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8255897246000059, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8006920058082668, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898755535165, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984548017133, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8568122987392687, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7905303236453918, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7563575458276199, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.684264011557134, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239979358605, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7170118739340362, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7718435016261407, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253705918843, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784113882971, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.787931199486233, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.901227412825183, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8723473798795353, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9403530608629918, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9477691417353196, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513678307756, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8376199699305616, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8783142487652612, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9118099505781712, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359884977915, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437698642461, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8783142464721407, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.921357615877791, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8976952977728596, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9073122176838428, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869922821452, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615382031742277, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9155072444977305, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8856314741543895, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9092645147421146, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952975710756, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9640516759902694, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9674102579314537, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9730364982948546, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.964855152819788, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9640516751155341, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704647748210707, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8175744729096686, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358199243921, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.798186780112243, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666522536069, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9111797127000134, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9367494775931241, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8774767975245821, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568123031219869, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9092645109151112, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5640984840226584, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6774739890392892, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6132365418914885, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321662448188, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526613596838, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673169218549, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8969755655967915, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8955226807777524, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493395825265, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245940416396, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8824278602366017, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7956580953861965, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140527996200501, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321811340661, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117841790045, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8365545608103545, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9073122241917684, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9032942102190137, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325157444721, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179799225876, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7490872037886238, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8757869930182401, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8757869898935038, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509646979348188, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867864294436, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8918110444572804, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8955226766580942, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8766343815866136, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972671212759, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070008479746, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8068526113599958, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.749087218126942, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9073122201622185, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789238079367, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619063180497, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8221891502580053, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8643104541141783, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7490872018425253, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.763483770524219, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545567377868, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8816148971927527, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9005297858014937, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253777029397, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666464846925, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377707441781, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7918210507049765, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8670357511406118, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8615382090210442, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324827155718, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306184318696, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8816149119681975, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8848377811248093, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8175744960146606, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283942207847, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.882427858641535, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7074046909063354, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7745833877510959, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6740504806920707, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935027733153, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933478428632, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.863391596268246, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8489721851089469, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8407826047314172, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283875488573, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467560489084, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9073122224446838, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8799743644879092, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933341616821, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.911179711956744, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942100750996, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7295197792973873, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7401743387663747, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228304333573, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210653683483, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.744656360125962, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7074047031714097, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8864204152688202, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933359934196, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737952065977, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637419571831, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7592254094192373, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437644687788, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7431680182354283, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106282918867358, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835334584575, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.687630008898921, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.804405915707808, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7371581405360038, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624666152745, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339771074644, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7233094799958957, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7008948110914098, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7956581053917805, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357650629357, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253729963789, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7956580955648336, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8244619323698292, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7154239931284757, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338481141025, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438950897107244, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849679972574, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437646284169, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8615381971322824, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.717011882703515, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127537485343, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666617967275, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7662936415750845, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7772998608091353, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867759200542, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672009128813, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.894051718012712, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.907312221656441, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.88483776185124, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149044901735, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894666126917, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9053222963775799, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8832359891356178, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8365545615009543, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424383191453, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9648551517234913, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7025300620377563, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8539127658966773, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8652240804602471, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568123058475922, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256513124615, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9196425337894224, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7732163731256296, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8333246014626327, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104523527267, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970794639893, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9111797150747596, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8856314726114046, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9219218405553152, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.879974375428838, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391625095521, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7620701075102504, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8933094024619596, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8354835398881871, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884649205285, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740239223699, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8267118031129544, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7759445410976251, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7106283056020822, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445573421548, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256530466397, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7431680111953761, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8418256482210723, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8104789035838017, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149894196265, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637522924272, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8104788962639404, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8633915958423813, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8449215289724232, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.804405929717798, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357568339918, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8661325119531791, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7563575311972025, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6601723865454877, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423185871593, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045963731192, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9268352832815404, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9492946362417797, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9394706069730738, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9329437123699039, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819090806324, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6315942986968088, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8438951160853959, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6224592874398374, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191578652574, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689615279086, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9252299588616077, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9167080753719511, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9319595734491486, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9230391619553397, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582613727519, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8418256531908271, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6926419751119405, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6876299922458455, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430461767837, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936397229032, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8116760055026465, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6909762949978561, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7634837697210884, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059405033655, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283112495311, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8962513658497396, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9059898168365429, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6959583220411851, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343777405724, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.809275991087596, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7826624782956241, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.863391594181734, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8311430490483804, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681115281651, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382104580341, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407825919606657, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8799743744725292, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8449215272512416, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884725236081, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.855851146366033, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9840936084730663, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9840936086161876, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9905874101167957, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9839708538655171, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9867771785307021, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9039745108393229, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942288658737, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9118099527066443, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583434252274, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666687651013, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648915917347627, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7217431948159855, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.759225403081094, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.80685261779417, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.830043770692566, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6808786239450731, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7905303112863046, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7401743453269278, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089199951585, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245976062433, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.663668948742799, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8354835516444942, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7170118975604194, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721967712833, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354709046887, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8568122945393989, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7759445688337366, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7704648022444449, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704648026672987, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976088915403844, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835386071251, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9257686330172434, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8856314768431909, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.764891619472736, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059174892579, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.90465053534342, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8386797551850105, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8479677550856362, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314726053839, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187368006321727, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8080672176619735, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.586996430520722, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7786493145995621, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942761021609, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331230220774, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086178986617964, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9319595766511077, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9518632304403843, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.921921836764295, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9358173551656453, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9190632924852332, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8661325133204686, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8080672065396359, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802362704001, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149015434629, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8244619247959833, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9092645042580707, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9167080787826336, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267813617531, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199652375239, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9579122716737054, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9582261204801856, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.865224072787424, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9477691449928404, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9669140192589915, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8255897282991741, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9278877977318524, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.839733950270883, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445479781478, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.880797084700607, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9420819118511103, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9299510374359943, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9314625083333247, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9588471153295611, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.923592321336789, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9626731129837811, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.928926332572201, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9525741280551411, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9525741312239425, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9543079679545726, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8255897265969521, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7943849603379429, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7813306290401245, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493166221526, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544197805204, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.781330617904176, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8164063839932464, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8221891191386959, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283960034716, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737838942715, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7310585742892882, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624862791262, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6926419595098418, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125623195485, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195122292823, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876300018862743, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8596637391900713, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.838679770994227, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704822667751, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.819893344312679, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.515619903326733, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6636689402668319, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159497611937, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137032382587, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300623362956, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8255897155051437, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8740772229090125, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8311430559684745, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512156084915, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884665957751, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8529354739996131, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6513548516310919, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8104789119469841, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104524218235, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633915924950684, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.786622824469019, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8092759840063504, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898571011999, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799929052162106, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.800692009053633, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8529354750696297, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7969253824990464, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7325918429930447, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816148979095606, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528037334053, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7718434904247373, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6688802818412094, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5621764841511043, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106282926737638, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370414088622135, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8479677450140838, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8577681095073787, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8749346253639041, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382073512143, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835428912549, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9309620700419735, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8925625318576711, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9224823407455971, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823381626106, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9429286003912369, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.867933851714825, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9246876936660311, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.926835281765236, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096117481339, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582569261773, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8991213769592379, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.894789462078438, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9273632869139968, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513713155608, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240821684196, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8031737811781228, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8333246058771273, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8128673237037115, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527709357642, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377688376634, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8386797647922513, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187367873475513, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8459424299400997, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681127751996, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267874876561, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9890130569142851, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9902915230385075, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9870795274742921, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9835969675789559, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.981735721413735, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8175744700737009, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8210440989192167, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.685949442737336, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.83223666454688, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990521337379, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7248702702899862, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9019206819967086, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.695958326837076, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673184465194, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118688059968, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8840392840018967, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437529543403, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8499711812099872, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430474391934, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254101841593, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8947894601302301, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.884039286369616, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8832359969400809, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528103022952, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277750028328, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8791467647758866, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9105453991207922, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9053222978099128, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748648215506, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9124361540687899, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6513548560862082, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7371581447886598, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7295197578537503, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585689315755, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174767664084, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.834406885917783, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9019206819967086, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8407825869379933, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833762354554, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575678535034, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7956581039482806, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8418256548718335, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631423625101, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204075372084, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045989696274, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9005297940774285, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9367494775931241, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.887984042587097, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149072738032, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391649742838, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8300437611600578, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8606036186718125, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7248702706889768, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358154110212, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437667747883, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9079671397284593, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8397339632336804, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9412234414969248, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343869659129, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625282823495, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.824461931103668, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9005297867945509, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8548846351571698, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545613445522, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297877558925, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8056321949180159, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9079671404302327, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.806852624685313, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253744101729, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970813696121, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7866228367227605, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6242935112200546, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5926666025485328, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933282841586, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163475445587, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7718435069934688, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7931059453708326, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7279754325884743, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.846957847095725, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339664052185, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.891054956945449, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9284087976242644, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9546474194756599, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.934395168740238, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9566342018913897, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7185944107474325, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7853085906989017, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8376199552007134, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721934756026, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672188914253, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8210441008284701, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8643104548138126, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9155072457024841, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755720917592, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677512342996, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8519528094365675, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8947894679421607, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9005297837310873, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760133331469, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099605089276, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9230391587299868, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9092645124728962, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8732148387742914, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9299510396024808, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437145507148, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.838679766031551, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7892337024874955, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.824461911127718, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677536805188, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392871560858, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.90192066821104, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.885631474791021, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140527903913742, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314761145357, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748613457756, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7620701038117651, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.814052801421331, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7577943618357517, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526316921395, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526263693973, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.858718579172756, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7786493019413243, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8344068737254039, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.770464791856926, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430497997142, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6688802644812443, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7732163715693712, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6654105542046749, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352489003677, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137259751237, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5736784301105586, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6261241879804547, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6297746129901681, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125537865218, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174922273573, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8509646946002682, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8092759808191275, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9278878015961016, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210440981910193, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998494472759, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9394706133676142, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9569571504596097, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9728307668614942, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9559813458274041, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9623913655544042, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9618217227887107, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9717790132031342, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9532750423903693, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9726235116209617, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9678992931334242, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8947894661794508, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.862467522926817, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6495786504855868, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718434858712107, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338462538713, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.79438494710686, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7943849572276839, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8300437604523176, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354719257612, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631528899697, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8587185851824737, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7505527477111463, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8333245871621523, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281541362486, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.660172378303013, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8104789087038137, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8539127590118076, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.903294206400101, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.903294199892183, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206672376535, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6370307864358596, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125588223697, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6654105444915634, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324958228178, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423282193449, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.969324201675702, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9257686274882733, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9518632315426478, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9603611586731112, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819108465609, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7090191331167831, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8652240869318022, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8577681042056933, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891356351773, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681170561504, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9263037285677513, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9353465119809622, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.95464742180841, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.942928600942092, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437146920453, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.86522408333799, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8386797660097326, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8587185813181408, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185811056555, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306393971167, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8376199686143945, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7745833877510959, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6825737159236934, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321821021277, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148368338964, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9092645193376899, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9437636568764977, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8933094028602584, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9213576201560616, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9543079658644001, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7217432177166968, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7534666562602953, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7759445413865815, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118830446843, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918635361675, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.91550724462895, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8652240777886335, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8902942279688251, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072494518129, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9105453990211015, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7892337148730615, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624843009128, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8469578452516079, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647788338053, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127486294693, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9142907180923382, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9425067250572505, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.937668963756449, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080698227462, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9669140228181461, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9059898170306112, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.830043771570624, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9092645210108432, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951018339003, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228183386765, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8376199701295519, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8918110472789237, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9026095995769023, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9507778877089154, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277800153788, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802267573857, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6943026827638893, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.763483772907895, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585914074875, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774739996803099, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7461389763976086, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7577943735177566, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.583203370951331, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789164582824, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118586299733, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7233094752837417, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6774739896147314, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506559610118, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210632929268, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185970785726, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7956581010027876, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7386690761841859, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6406358617231829, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884526579488, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476566929004, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7279754407826354, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7981867727197308, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8848377608052447, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106282951432247, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918380255111, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876299990251401, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7431680121946275, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6774740096862232, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737950299813, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673042418018, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6406358625760872, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7325918410273554, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.713830747297185, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584174978770845, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918429973908, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9278877995567123, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8732148277775625, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8933094098485567, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9367494760488211, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9358173546779658, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8652240892321239, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5331544135239814, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7648916166966353, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872045975101337, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849468685089, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8210441195880575, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8428631411990969, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631431901951, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897199050137, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281509727635, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8879840446789258, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.91180995010659, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8128673127728648, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068920141764, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354720677829, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9339146286490749, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8705972671477644, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6992544173138598, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835494824333, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631403177406, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8080672423641204, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9026096048071676, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9032942062724333, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505411459521, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185746418269, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9746286875225354, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9805806521481841, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9738443821333577, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9709092437447628, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.985271386504301, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8895288452483626, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8864204108026336, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338510519645, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933762621747, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923193689389, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.931462511229509, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9142907177799701, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9059898224408306, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9376689685160164, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213846738051, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8175744808649483, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8104789104623862, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8438951009668207, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943929894103, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.840782604797299, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9099070103531735, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9202179872171656, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9412234390277111, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.929440397111467, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9453993935346722, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8714748631491129, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8092759710198548, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8300437545384353, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637491963198, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467752048743, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7356416432982497, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7704647949887858, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8311430500542099, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575306219353, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059567319205, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7813306332213494, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9019206779785014, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7786493178069708, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528163795198, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633915941027858, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8300437766608106, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423245264594, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9278878021428503, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283944580286, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388105785853, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.826711802678003, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8019358091107274, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7025300607139248, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799929029755985, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850200837564, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8816149014525467, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9477691435047965, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9235923166159035, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675300184919, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.924141819413181, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9289263324672413, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8774767872261032, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8872045967062678, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339708306232, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9445872077865961, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.824461930046486, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8856314720290396, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.879974368430297, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.845942430351764, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059396959859, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7416740282351114, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8548846434302302, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.760650654361206, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256411449383, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.834406876446335, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6076631678892729, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7839884674908957, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7732163833946872, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094588727365, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416739988732957, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.909264519081785, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9549844661566651, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8489722035028467, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9142907230087762, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9324533065106366, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9549844688541739, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9462003537528352, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9643214464818368, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9704646623718557, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9536217941806931, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.965641314103713, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9536217990830709, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9640516766753435, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9873750510922192, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.965119114111519, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8469578426443279, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976952954062557, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9343951633378408, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377727032452, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9489172599998045, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6893056269650029, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7676898560627509, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159538956018, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303212932149, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163715415024, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9005297877696348, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125634640638, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7248702617648984, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346264706008, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321767461738, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6926419807595401, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8006919947707463, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7853085706837124, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933234644874, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149901228234, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333245860308944, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8757869963717909, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8418256552137574, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210440979735686, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314726581704, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7879311883287685, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7446563569386343, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7461389968193696, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631480653721, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311958765512, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9005297913256346, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8962513712856018, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.905989816099778, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288553429153, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418224237378, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666590058713, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8006919903459748, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.687630003307835, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228695465504, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933565204446, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8670357578181298, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8832359878467738, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8577681139966505, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253672130674, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.931959581688005, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9257686320118514, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7931059507730693, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.823328401039325, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338467309955, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.795658097271414, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6460136913626922, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6636689500663114, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7476159508298427, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916046830299, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754512526064, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8438951157694011, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7233094668000073, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6825737159331885, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.845942442200897, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.809275977061212, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9600626860747432, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9529258230365817, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9549844698858623, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9529258270616459, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9697854134351053, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8856314749464615, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7505527587951777, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140527914995874, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357471490796, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690687992247, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8840392843517306, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8080672034426455, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228281252091, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288499551285, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528091262971, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6976089353806421, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7106282868242763, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898505007503, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339601611267, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646011463797, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8548846337545049, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7138307512623666, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9059898260433085, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711725740096, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743718997705, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8840392850536238, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8848377618325549, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9005297909298973, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392895593826, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424467879243, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7745833722539055, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8152324958599845, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6943026472495423, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.746139005716001, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677671668234, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.919063292627217, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9304582594650072, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.936285005165355, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361567615829, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9381240105046815, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802364351544, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7879311941264077, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7745833812236853, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467701557645, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256454931705, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8895288496063164, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9073122216217435, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8661325030176718, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.899121369658764, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110402594583, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9289263296960116, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8407825975897678, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8969755715327374, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086178956532489, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289387994689109, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7310585552706104, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.814052801421331, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8056321695523294, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8991213839180083, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928974437015, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8210441075453382, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6859494788902751, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7799929051940637, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505393234722, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846412780541, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.885631486730171, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8344069005257354, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.853912763872464, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424425087007, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970859121598, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8044059118060781, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8116760158248469, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8152324890895818, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149911192067, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867770927081, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615382038602022, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.875786990581717, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8519528051465646, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366477392744, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204168088078, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8221891142260851, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.779992894038466, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7690802479862621, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897055046375, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416345423368, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9235923172708124, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9678992930609217, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9445872090681678, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9381240108342511, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9489172644301265, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6859494595079081, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8548846497408064, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8459424391803324, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.901227407861475, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416442519115, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8984105501647608, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8418256389408656, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.804405929292225, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140528004447635, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942262221638, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7577943886593015, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5926666233484011, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5195213487812399, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118912799328, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365608931144, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9161096116072728, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8068526224723626, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.893309402089338, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.876634389857379, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933722340634, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8643104493210382, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942246618386, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358225268536, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.886420420361984, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312054115754, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.881614903558805, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.832236657588744, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8840392776654851, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.895522680846637, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765280820034, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407826014132601, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7918210531205956, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7826624855489406, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545776480765, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760069881223, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9142907238859453, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9543079682049205, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9334308074246574, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.946990228124531, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357616458267, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704648072538847, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8910549535053148, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388014611049, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085656088524, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933395069151, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9105453985376778, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8749346125137827, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338505793913, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835461484467, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333246004131933, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9289263339874326, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9353465125742472, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9196425371023657, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352803723139, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437134674291, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9263037277429269, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840447549798, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9118099541914098, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9556514201221773, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.92630373067383, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187367875627589, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8633916134782983, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.866132511753855, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797786711204, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.783988448915488, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9481545307315566, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9556514183464546, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9219218322468131, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.923039158955141, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425368789767, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9149009587558546, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.93146250891493, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8376199742969981, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9105453960274476, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213802599389, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673146762905, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8044059186170397, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6926419925590831, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.710628301504461, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947088038013, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673145384867, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8519528150164748, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031737849483608, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637469337751, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897219064222, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8128673115498452, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423207998042, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898498586435, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435043540718, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307640177638, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7490872107771012, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6206215941750152, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358276169991, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145754335832, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548708655237, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8962513763109635, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9167080820858717, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9399133514607076, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.903974509730215, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9284087947815344, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9118099556453931, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840447549798, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8799743681196993, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9299510379881671, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9343951667114816, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8723473767174779, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8799743644879092, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9099070007286627, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.894789462971749, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338389888576, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9746286878309012, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9773707994093755, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9651191117515507, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9730365006256886, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9822877030971883, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8848377821345563, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9230391581859217, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9437636549430595, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923215630585, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9155072428178979, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8816149024322504, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.853912751531274, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8449215301778193, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9425067244218414, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545625851097, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8998277750778356, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9257686316032618, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187367930565304, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352778353001, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8925625236328678, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9019206792409613, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.925229963599892, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9412234450633008, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625329813608, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632871629743, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8697145853478263, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.83223665037466, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8955226847651028, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104571839948, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633915966522107, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8902942255859532, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8489722088114197, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.837619973664953, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9092645190891507, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240767095314, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9748211570948933, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9425067205514792, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9734434258652978, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9477691435276192, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9273632922859972, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.756357542150488, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7371581511033442, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7745833853810656, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389962009467, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416319835788, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9433475768370047, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9458012715154027, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.86060361718431, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.929951039675729, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9441768588575439, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8799743635774956, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8840392833894896, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9012274023596154, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145793721786, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767880203338, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732163611566646, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8872045930997333, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7892337040990932, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430339821984, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213846744539, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6315943260511958, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6388352900873202, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6477981807298551, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.658417480938172, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593352239872, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.779992900341031, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7853085895113663, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7648916068571522, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897194245558, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956580899426632, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8643104578152246, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7233094672151761, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7690802475165798, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122916977644, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916012794511, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666453304031, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7264255997804057, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7008948208086464, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104789043235651, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762928964701, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9661559685638546, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8652240771016476, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9399133554700131, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9623913646738185, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9549844679526031, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9429286001816631, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9142907208493779, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531252800146, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.937210788118017, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819133181199, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8732148382310571, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8365545554124347, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8783142401099813, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199671997983, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358265218146, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8749346200508876, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7931059470207302, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8519528204404323, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377640016525, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920108886079, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8774767810979358, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9224823456122271, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8469578540298732, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467684853563, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511472564534, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8895288545752749, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.83440688002807, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.767689854428291, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943961017692, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366574889027, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6893056126817847, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754420271509, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506466511455, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.875786988642231, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118742932021, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445519447993, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6774739997569693, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5506073844664529, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068917231439, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289387915979131, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8925625334914475, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6976088930996401, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8322366575178323, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673232880724, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277739456242, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8723473788986147, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354787096787, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.822189121916472, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517247491663, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418242390579, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.753466648437992, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6076631784515827, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7981867880823951, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358301421651, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578523144866, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6943026610998558, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6723316827305174, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.71223218418072, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706083047687382, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647969083965, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.723309480930945, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.781330620651693, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8006920037257554, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583270049551043, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743609276185, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7732163723935866, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8233283915741711, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7905302976048394, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432050510784, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306216757786, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8244619357210541, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8783142521042978, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506540563038, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936720607642, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505375754205, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5506073411369851, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.766293651920865, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5331543874007397, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672072177284, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666022417578, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666568854981, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423228194917, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7620701221696853, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056001866465, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723734079424, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8633915967075265, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7592254066232749, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.878314256656229, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148249760745, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354685981873, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7718434956688647, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159294348382, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8092759669513739, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358109302032, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666642881097, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8289388087481567, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423207998042, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8056321745919661, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563444589134, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149661358205, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9385759677186073, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9385759561161177, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8984105578093764, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359868250171, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8895288506780863, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7853085844777324, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9314625075048724, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9005297873988853, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346170860716, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772267236282, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802432605547, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8799743684848704, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8976952930874678, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671333660617, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517247880146, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7386690608926744, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7446563462219181, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7154239830099962, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197639014703, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850354864915, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9833429597864685, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9798226810673395, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9791955097982722, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9857180666716161, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9811668697209276, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8080672092837614, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6774740049798292, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7718435017017817, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346226863787, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640127616536, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9778834110387787, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9681411432392747, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9883127429795424, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9752018382688395, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9732407181075694, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9399133519087596, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9556514184256311, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9324533074792437, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823387296949, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.950777885006478, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8783142491712878, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8198933294006026, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8587185725398052, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511408334539, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647059103922, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.712232173630826, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7386690738254895, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7461389887272568, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512739068285, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.795658095944247, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8568122894749095, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6442251224487606, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6406358665380513, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563454982245, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239846549885, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9059898119176025, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8705972585725263, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8872045985445746, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430458874667, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339623340349, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7416739844921965, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423228194917, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7386691058805703, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819563507422, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723734079424, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8558511534622152, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8688267820242946, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7563575852740045, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127546322647, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163697075759, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9449947121168232, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9711290922474749, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9136765268309325, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9477691424434125, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9481545306902756, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.753466652696395, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490872143096283, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8386797547340021, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.762070095419919, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148344642365, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8365545670722129, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.717011849540796, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253771225221, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891236053478, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277775617262, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9798226811688524, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9864678508250699, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9798226814283515, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9732407164257543, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9666631753108759, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8418256407121788, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9425067251058006, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8740772318102441, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531285916967, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9477691459573957, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7592254022463206, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8255897227510428, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7386690625533445, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933412263928, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681158274847, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7279754311610541, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.93096207470276, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.895522678901993, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473844339777, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9441768608105846, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7170118723071038, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8092759749705333, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8489722025878538, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936494540727, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321848112605, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8766343836494128, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5389832165911764, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6943026680171717, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.726425621802948, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419904050389, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9299510372141468, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8895288555075588, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9500414730118557, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.960361160262986, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9674102569021742, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8816149038637306, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8469578485377118, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7401743676548285, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437698517192, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8783142372494231, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8679338498211712, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8947894653846967, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9136765216761716, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9219218362871482, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916122198061, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5869964670912158, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437688490578, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.824461937359479, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300608992069, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947541543199, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9111797125648797, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7943849467621162, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9099070070000432, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199759661636, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624698684326, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7969253663110752, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354635880498, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.860603623838167, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437611097484, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772230811678, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.746139005744795, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8984105544185482, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8910549499048762, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127497613582, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.861538209601203, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8221891295768445, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.946200358239976, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8267117866283314, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846349268815, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438950971602984, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7217432182575707, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6757646129750016, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7233094807952161, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.808067213233286, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754266809518, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7786493012498316, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490872168418653, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031737938345037, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215215720883, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916069561245, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.914290726977099, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8255897195885452, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8864204149778883, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972723785188, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256503360323, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9257686322366003, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7248702814789598, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8799743700639995, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748700806728, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681149808094, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9648551534960721, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9748211588594927, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9671630462761548, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9597620538022721, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9825575155057447, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7662936410524176, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8333245983976041, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.82332839718179, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278629091041, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199744580121, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8428631507546689, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8068526270278769, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228315918007, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441037118194, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545747958973, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8749346181637268, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5698526377885257, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.874934617847512, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891291954428, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110454371591, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9661559685076608, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9722043750882793, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9612438044703873, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.937668959126936, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9693242004390509, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8757869877637412, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8991213886565892, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8596637465700495, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9299510352179922, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.911809956885455, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876299925410132, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8774767882796157, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7008948080937651, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.84695783961315, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759780066763, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.846957843053029, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8872045976034032, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7563575429358447, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9348724492815558, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897184114961, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8210440931058999, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8128673114876974, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9507778855005081, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9294404031467521, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314728034322, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849665869409, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8128673138294787, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933456094788, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825857066038, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704648056800734, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9118099588964006, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.932943713327885, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8479677445176917, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086178900986787, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9289263339115493, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7461390056874697, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7549150027299744, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7371581558507361, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837964599329, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311948259391, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.909907000093025, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.946596665534594, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8479677502889835, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086178959324873, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343883717467, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9284088028373205, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8479677550062663, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8080672190177799, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513716177641, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825910729949, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6926419728224608, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8705972585725263, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059375123498, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085855184113, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339623340349, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835553121054, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9235923197127699, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9381240170375893, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9066531320098098, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9477691459864668, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7981867798318292, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6825737280270947, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8606036235780938, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.70089480495849, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680178116619, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9092645141817102, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.87578698559839, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9462003555241608, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972668626786, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437129707391, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.808067207909291, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8397339733404292, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7264256174049004, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760122162022, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.731058565253743, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7994423272653474, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8479677723667562, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358279143004, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744629582482, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314786747537, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9039745077901236, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8984105525607209, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8267117882313773, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288333561087, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9263037252590699, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7563575493151028, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5832033395658363, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7549149886981922, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585711714641, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897263633208, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8864204090883846, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8633916044935415, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631441112605, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748684886434, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467675141091, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8902942271108375, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8688267823322918, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6636689505255368, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833785681036, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424426309929, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.729519799135522, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7577943735177566, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8116760332745356, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.677474016837066, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241856750404, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7839884570385803, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8714748585575124, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8499711739129345, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869867242176, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891277778242, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8300437527200653, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8019358145662183, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7981867874232167, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748647198508, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306179952921, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5583269702937358, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6495786075257602, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5331543882258705, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794003980264643, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.598312213638061, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9111797124741354, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9594592596208946, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9353465112682521, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563659515505, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583405344896, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407826009437981, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7943849545309457, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7732163636512985, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701190778274, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916209782486, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8449215309087919, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7310585818683597, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191259293361, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.800691991272168, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416505170561, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9252299490870615, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9224823408902203, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8848377656790946, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361532412897, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898122036291, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9543079666215345, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9124361614590845, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9284087981532863, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9543079674851783, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9367494872060009, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8311430535189595, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8418256544974231, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8740772285005889, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737682435673, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568123014006715, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9473810430761287, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9717790130185113, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9118099550920704, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9686195689866905, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9425067237579602, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086179042569594, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8198933351040306, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.884837774196443, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671486229808, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185879228264, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7563575493423956, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8766343861069795, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7356416295615545, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125900851906, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.801935821021174, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8164063644865194, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8116760121326426, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8856314798478109, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.852935466993063, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441063923241, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8652240915492572, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8679338462602209, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7662936351744645, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619336510817, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.869714584296508, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.860603620754304, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8757869855434428, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9213576162289244, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204057137517, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767860481402, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8887587867026121, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.831143045562533, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8558511538308374, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772246584655, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045988588764, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9669140223534001, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9504109791918643, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9381240142869185, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9362850041394024, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894668989606, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5755880112806785, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7264255948660402, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358041577496, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020616198059789, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754491714621, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7122321958114105, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8407825810948029, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8407826081309158, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677570501499, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513603892749, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648916176778799, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8723473715955488, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7799928989629202, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897237908923, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905302976007603, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8210441221315158, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.838679767183951, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9155072436595099, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094078945572, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148329546205, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876299987238016, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.785308566715231, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7634837574339294, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714994517885, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413849828907, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.777299850975266, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6001883570088142, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6548947368118646, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544333724948, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690775546401, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9257686408720824, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9059898170355041, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9207896805964536, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278656929617, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.782662502705678, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8940517214350661, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.824461921689291, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7690802330083936, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.850964703467764, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759809657378, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086178915023321, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8489721998560202, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9149009622361437, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923181028897, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218408089125, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7918210644893731, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7122321927673323, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7233094576933875, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528180887096, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.724870266830549, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187367914144351, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8449215261447817, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8407825974578967, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278605516552, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358308219122, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8019358253754427, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.81873679082217, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7386690724296434, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948096587033, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149740725346, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7969253661260645, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8164063888786056, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031738164241855, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.833324592035957, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672296689, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.817574474354996, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7905303133531366, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8774767895646053, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835498296781, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437663029332, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8044059092145883, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8152324942218327, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358355460408, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942260984841, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339600373281, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8092759853265582, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7918210513012, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8397339651455191, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382006043584, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.87407724537163, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9299510418267704, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8783142437394696, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9686195700185753, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187368076175463, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.960361158919117, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9618217262302138, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9709092446606963, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.954984466134616, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9504109766486074, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.953621792224042, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9376689634047547, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9420819144534256, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9092645143535938, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9230391617112683, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9358173541033192, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.783988460946613, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8732148221980859, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.898410554864136, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240760184572, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321815888436, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9445872066339812, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9566342023580602, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.942506714138643, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9492946378581404, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9686195677631726, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.707404684701369, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7279754445007899, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8068526266205144, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311981603099, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8976952947174813, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9019206754551048, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9073122241917684, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8596637420614521, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797592559716, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418165377819, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9458012698299326, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8688267819912847, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9473810467594581, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9273632941328469, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099069978069902, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8397339698344317, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8210441121935869, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7534666685560877, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435076301637, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366641286028, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9711290921910485, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9857180665913846, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9637799409110662, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9711290924343153, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9674102584435188, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8848377639970804, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354731149673, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8688267702774067, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823429294265, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513678590096, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7279754425581949, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7799929048355655, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.78923369761463, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185856348408, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431997765368, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7476159496188589, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7853085782696774, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228081855231, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104579084886, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438951050507081, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407825969249534, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7745833966031846, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.873214830686134, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894637963998, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9196425329574353, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8807970823781752, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8872045893053154, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8469578432329194, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277811517843, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045914443886, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8289388042360676, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8705972654439679, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388065773956, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680159340425, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826625107430238, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9522199318540852, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9343951655316848, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9224823451885213, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288459397676, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9278877998394021, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8895288552313078, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840440874303, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9230391634011369, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256411126802, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646985932048, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9511422204624423, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9092645139945071, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8940517203708446, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9585377233208293, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9695556519410291, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9092645142375028, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9678992916106871, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9449947139685647, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9142907268844163, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354778146317, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8056321722897313, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7956580951194716, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8688267802893785, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760063781323, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919898351966, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6169358359245105, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8128673241658682, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7371581474910168, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059471053279, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.793105952874953, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9353465072817605, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9381240155367083, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9136765238478506, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9458012676846362, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9202179827879509, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7981867762869747, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7745833966031846, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8376199692331686, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755728011891, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.894789464933916, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8807970810534105, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7534666503715818, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8469578396284142, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430448458568, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835476250972, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8255897204053402, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.835483544969733, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7839884601353091, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312009158174, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673068265202, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7185943951957486, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8104789057073252, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7634837680232094, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046933955338, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933478861906, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7074047203770428, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187367836963071, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6909762881545167, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737839819304, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624712067914, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8322366527883001, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9161096130675186, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9465966674000768, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835506383991, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531215859583, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.828938815987635, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8267117845505928, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8697145828190944, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.924687693574553, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388152979359, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.859663750366236, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8459424364002472, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8864204168359963, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.831143050067302, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122929824967, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666524187178, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.800691980546006, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8311430528692049, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835364708094, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283904248319, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9012274064336072, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8955226801772176, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531271305946, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825917891956, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346179579408, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7416740128721676, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.766293654907698, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7853085887802308, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358379962386, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833944677412, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.842863150566664, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8774767886965422, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8322366589257724, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441150576553, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835310083708, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6943026787265946, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8044059136414095, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6740504966192928, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9053222935777978, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228766367298, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.850964706243976, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8376199761321353, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.878314247754629, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036174546122, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127458467984, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9289263301248054, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8568122880898925, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9092645096229075, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872045998579762, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9449947122922627, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187367845541492, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.89405172471319, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7956580925238748, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283898812064, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.872347383901959, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9111797087890068, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8791467655469996, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8895288534815812, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357593848057, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467639513647, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9263037339895428, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8887587912214887, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9362850048111281, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823379178816, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.936749478921947, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8104789049595086, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8832359844860325, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8856314743660842, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.743167987579778, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675353635396, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8998277765714938, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9066531281661749, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8670357476736013, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835374535686, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233284005165425, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8984105490365862, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8386797567041556, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7879312052306663, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277777285146, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199649231332, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7905303275949463, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8740772410929459, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.692641974922255, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106283129911815, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.858718570887029, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333245910373226, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8333246009189041, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8449215322306933, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513770851909, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711739961712, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7931059597489536, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8187367884733543, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8080672236374875, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846428844985, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918332895348, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086179102852351, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.869714576391094, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9092645123627806, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528025652233, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677528512827, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8164063798395526, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7892336968374879, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8864204047582525, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251242659378, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312103617335, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6370308027469784, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7606506563451411, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6959583251595577, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947148051241, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.682573724933141, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8991213900960461, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9241418188005545, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8774767900059499, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631386303282, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620720707491, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.78398846827538, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7549149862976022, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.622459323210433, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358563466474, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943636385995, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.800691989616497, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.837619975036135, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.822189136078504, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711809831623, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199793070228, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7401743688975194, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8568122948577868, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8333245915274259, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575437256639, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.799442316483092, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8092759627073657, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.750552772134452, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8300437587744496, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760215559923, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191352998166, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.925229952044497, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8799743684848704, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8799743642712927, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.905322298025918, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517247880146, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.901227405001978, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354796373558, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059168668128, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840441147064, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9425067206715263, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.842863146479513, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624882178858, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7416740241679708, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744809912666, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339600088765, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6513548509975886, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8006920158518407, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8187367988306413, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8104788971873235, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.888758795329324, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9329437156002163, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9453993951907751, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9645892734004565, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9518632295954363, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122215693576, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.763483764646203, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9390248152944303, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9111797144394874, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933749070451, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303155515214, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6584175160462339, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6909762940867773, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7341195272186267, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740546478232, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943828865559, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802513583842, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8333245983976041, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228358667846, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849703354786, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8376199744580121, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7201715051791893, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.85871859207161, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7170118778596841, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.821044120604848, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445515186968, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9314625048811812, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.927363290398778, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8210441005279141, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338404864292, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819156578734, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7826624831543221, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.624293520469339, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8056322007127822, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916249278491, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367934490238, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7745833677254792, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423188513964, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7918210836645927, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666556275165, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416332364567, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8019358154050075, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490872152746532, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7217432002045269, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008947947198577, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740221765089, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6242935030221709, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7295197798793784, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.665410557584807, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786832700712, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665753312922, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8774767887919699, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8910549546378609, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8856314772194465, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545711191819, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278671224983, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8469578408445808, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8679338510415707, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9019206855169, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382074226551, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759833599422, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6723317149552109, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.675764630711824, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6893056433702949, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201715201194931, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936571118767, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7826624951331231, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9012274075978673, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031737856196289, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646108864064, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918307021954, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8723473775345831, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.908617897178584, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8267117964319854, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325094502184, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549583813603, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7799929032812468, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8267117951133947, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7905303091902675, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036198822302, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201714923549764, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.697608924064507, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6992544552801061, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6334102625980456, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632937495337, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.746139000131289, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8278281487015727, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9334308108735281, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8596637497356122, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897173274435, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8933094052147538, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8670357546153254, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8092759790487248, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8947894675300955, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740195679262, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435006089748, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7969253713135276, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8910549472467398, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8652240959780136, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681022934532, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942095872286, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8244619332899875, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7799929148672307, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.796925374673746, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199736859096, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933359043776, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9742394378371735, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9674102576577516, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9790357600344952, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9671630461239697, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9566341979802043, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9343951677210977, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9496693708531304, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9566342012909046, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9653811618562925, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.968141144159062, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8783142510311096, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8732148411468005, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8872045928575696, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094061970566, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620782178083, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8740772228474475, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8289388023067328, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8116760361981364, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312042946273, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526258617614, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8947894661814898, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8244619279955138, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9005297802907143, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256430157708, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185899820774, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9314625064942931, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8940517226267386, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8799743704986548, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9492946378329444, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437639212067, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9213576192716548, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9458012691783666, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9618217231327281, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9118099537890375, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9416541606554609, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9695556511342482, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9728307665645199, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9645892703302638, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.962391364887564, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9704646633895642, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.926835279742003, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9190632958584384, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9367494787044226, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068975284645, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031738029275676, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8469578564936204, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8740772410929459, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228208345911, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117939496916, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117839817847, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9572777998591977, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9178933710263332, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8918110494057945, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9529258225864831, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070023374628, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187367901230606, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8418256467174854, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8887587933358363, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759702053645, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737855865493, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8509647119280134, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7634837734697338, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7839884723971405, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333245868863232, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297918290961, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.925229953162914, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8749346189842286, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.911809953325718, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9381240181476723, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.894789468701788, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9026095987423959, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976952993142165, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9019206742850042, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.908617896841046, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206834165397, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7279754454546522, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8244619265466437, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8006920185099369, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690802427847, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441131197127, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5869964345048408, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6909762767036635, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506569643259, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205995770193464, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094820218972, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.642432492106091, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8233283928624842, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6242935326060277, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365677044332, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317032649878, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8376199740447325, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.86246753443444, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8244619361388842, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849441001697, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063701782132, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7264256081428349, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5851011428209776, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7090191266726743, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389831935219752, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632915113398, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8940517154363362, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8587185825951075, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7994423376081067, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.866132493681832, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197907213288, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8418256499878469, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8832359927327829, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7943849711203467, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583222579186, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526211398616, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8596637455758629, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8643104656481998, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9039745067782761, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367938210711, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511428423002, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8449215316873714, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8824278591854793, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8757869898062411, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.818736802526613, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070042004813, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8104789053448567, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8397339631233915, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6706082827717416, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317025090843, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8940517200853768, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9394706094049413, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9190632874777657, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9420819118500163, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9496693683684286, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9629528320790486, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.887204589463761, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7217432084090389, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7879312045144529, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430513318184, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306412452956, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8152324922917531, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8679338345594232, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7994423104758783, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506671514721, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837429277772, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9603611590299185, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9224823395607601, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9039745082310092, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.90796713693091, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096189958094, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8548846382256162, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8519528103441064, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6150878346914166, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898581179424, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544303216763, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7981867601122495, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7905303117204856, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7057850354641705, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102350325832, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872174675909, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9348724522342554, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.855851138676003, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8732148305912102, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748605866901, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576183145268, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7534666458777043, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7534666588929647, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.45519859587967176, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.783988472658768, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311924213603, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9949788501807956, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9952448002291698, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9918752904388264, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9902915236871052, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.992654173481189, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9853843294096979, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9932550102953687, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9875683487134526, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9842154384538538, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9922444630716336, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9314625092033914, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9086178892277446, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9425067238607269, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338526333717, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745102663977, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5467381422149593, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.718594395040822, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.519521308536923, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684554899968, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.616935848708407, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7008948030195362, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6297746290807589, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.38491216158047875, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331280729553, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073668897634, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8175744925696578, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8164063970777727, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8278281573518549, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879311900260414, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715294915578, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9348724495535639, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9623913648802986, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8902942262344423, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.937210797103223, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.929951038389057, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8438950964993325, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7416740070848994, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7786493104731453, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159629489835, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.704160139123303, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8587185933694154, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8705972694407177, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8856314788134273, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936445949693, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110452263348, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8311430556557968, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6495786343338621, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8606036223470876, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581061106793, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311883221491, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9839708513847749, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9877587241568774, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9835969680674272, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.987178785187038, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9926541740363275, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333245993399921, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7577943721010898, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6442251179819017, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528107691704, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760259275552, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6959583157888509, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8322366544838314, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6424324724815317, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059179092841, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110471615516, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6513548764640011, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6601723900385049, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8198933396451887, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802433437589, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920170194408, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8732148334572976, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9425067266354205, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9032941995151983, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117886562031, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053223004895158, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6774740113249543, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7057850199753456, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6943026746355843, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.754914989742121, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679365944317099, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9012274023674588, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840425615951, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.810478893365984, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8955226808268077, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.879146770144685, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9566342022428704, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9458012700821323, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8910549537908979, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9367494767705553, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9394706091223308, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9477691422342518, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9489172640535525, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9136765306977332, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9511422203963662, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9299510338632194, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8624675492692573, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5525396821635994, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.709019148301738, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947388146744, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388115152568, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8749346159827286, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.884837777575793, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8278281550706775, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647810613793, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185944132691401, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8289388225471671, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.884837777575793, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7826624870969227, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199707656262, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675321912606, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9381240129272135, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9462003580607135, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9219218410899239, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278620185176, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9358173561455556, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7106283140518913, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8006920087927151, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898524136062, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504785218787, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666714735965, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835358751586, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9425067266354205, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8624675299158512, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354691117536, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253754626093, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.909264514499294, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9005297898735891, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9465966656107615, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952966501721, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9362850056241722, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9906599752462165, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9918752906421273, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.994615061912377, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9920002462284849, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9913558222046093, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.960951707791109, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9572778038194293, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9390248162192697, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9518632305146576, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9268352889038741, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.757794376435936, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7122321950791719, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8116760334835631, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358176114902, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336933566914, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6791786862760463, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7577943721010898, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7956580877399624, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867735047328, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760259275552, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8998277764629558, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8933094127375657, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8856314742863737, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105457482788, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.851952808301041, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7866228295148427, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8596637550815204, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8652240871744057, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437754350125, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8723473748036444, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.779992917276361, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6876299686659868, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7577943674017961, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195390907921, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047118377105, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407825776347003, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8807970768820226, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8092759805763687, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825907937397, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382075131783, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7745833924128526, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125778431632, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.785308580606123, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416363945283, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998452785326, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8344068879832386, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998758133227, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6740504929000635, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.816406376889799, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933494294782, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8984105536264275, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9105454008543519, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.908617895452808, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9304582591736735, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9314625074998427, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9278877906852236, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9329437111613283, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9477691425960642, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9353465077492112, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505419029027, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9161096140026682, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976952897730265, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.878314244387601, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9149009552099595, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9319595782942602, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8278281562549167, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7476159760553014, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7772998512104511, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.710628323588297, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300616487263, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6334102896420396, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8679338473657953, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7371581511855334, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615890525679, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191233154985, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8596637485694056, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9079671367486656, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8255897166494068, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438951039141103, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772318698923, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8757869987525075, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8056321703193932, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8895288457084762, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8864204119651623, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117830546259, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8856314747261256, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8092759744794089, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9118099535900384, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059220109386, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8799743760520385, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9640516771018313, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9092645157763166, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9184802426582892, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.925229962787184, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.932943708666523, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6370307759431659, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6654105665108436, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6531269201101356, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210827956654, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149971686998, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8577681121671087, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8587185894148811, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7138307681222538, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582302527348, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366433555205, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9289263368956291, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9053222996391589, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8210441213112075, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.822189134688594, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8661325258275959, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8998277829328818, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.830043753690628, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8947894637497906, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9184802471686958, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359880998146, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9284088026021606, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9579122731852738, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.928926328175812, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070044985179, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907208031271, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7461389794507612, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.867035762111826, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6424324645736575, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105579451948, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216205824395, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9319595778183328, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9241418236066501, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9092645153651209, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952974243391, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632905419599, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8766343826825204, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7786493113775734, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8902942290515333, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228365696009, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178931542963, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7956580933033631, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8386797670741013, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7074047031816174, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990520380382, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300260877125, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6943026509603002, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7248702800870793, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8740772393340203, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.747615946198445, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673274412327, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8459424317639281, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8210441130791144, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7461389893816347, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.860603628738228, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105500627455, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8152324910983683, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.794384954513738, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898616863942, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303048778071, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972679771472, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7549149671709781, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7759445515277507, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8568123030236866, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303049317568, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619352568198, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9485372358471155, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9376689610004217, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9445872068049339, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9569571492075201, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9224823509862903, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8568122905844442, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354695473854, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531304716972, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424360461897, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505403551867, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7931059350595167, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8354835444835396, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253750924999, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.781330621229834, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366533982283, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6001883805756043, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7325918492921771, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6992544417858695, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585816956573, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9219218329880817, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.89029421974968, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8469578431477466, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9385759596233443, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9268352789054236, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8933093978774252, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.787931180821668, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9196425319070004, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745092256559, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513734442421, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8976952900126532, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9079671371122098, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.888758782649296, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037288498005, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226805256673, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.670608293316929, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7662936596208069, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898572101513, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494566306914, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867727034013, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9268352778002908, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.965381163175322, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9235923077427954, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9572778007976686, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213823911514, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9314625107244968, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354644183402, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.933914623512347, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9289263345170427, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9511422186577636, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9722043741074885, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9704646630688372, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9865717440943451, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9726235112479256, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9726235098970161, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9788748080046565, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9884026388325334, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.981453435437373, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9824231155981814, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9790357586871116, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8519528148184279, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8848377636755385, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8933094076408847, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.927887799977546, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277853435529, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8267118005910625, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8783142468620112, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8643104586941487, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359800366768, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673096363854, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7994423059672084, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8872046002183553, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.777299849977379, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.839733973133205, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303080463733, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9511422211589632, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8940517155235336, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8925625304150566, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325159703344, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9441768543734901, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9273632928986485, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8910549569216707, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9053222981215424, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.926303727131762, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819130458625, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7090191158611702, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8643104536638019, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8056321848274512, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619397580634, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802528550058, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8278281473083665, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8068526286551795, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8940517155051225, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.845942441708553, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306199667616, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8479677547393316, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.832236655269668, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8376199676258945, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759708671615, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511372818975, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8799743627314571, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.900529795135464, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9118099592894315, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267780906883, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218379374899, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7170118852488369, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8587185825951075, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7839884596781547, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416519051535, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.694302649209092, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849502717801, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8816149010948701, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8255897155563087, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324823925384, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256438034332, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9458012667384579, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9515039979529679, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9376689589753001, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671405290557, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9053223031844319, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.556399612661799, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6477982235604053, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7074046949619639, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723587932676, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983122056347432, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7662936266194169, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6424324635642958, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5774953449103584, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872242700028, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.700894803347522, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9473810484588269, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8548846396364191, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9507778823373505, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414749915723, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898201128087, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.622459327839274, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8918110339603017, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9196425385422913, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519527923879178, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833677535816, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.881614902379188, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.847967751949143, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8947894642515316, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711819459932, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9257686344833105, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5156199520018792, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5660185430041587, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6584175160541114, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163796535646, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983122100548811, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8615382022134672, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8791467724724347, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9046505331752622, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505371234561, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213769585846, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7592254227352411, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6601723900385049, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6495786145601804, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936212455779, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105334741951, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.939024820929338, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8766343802956493, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8955226790125861, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9278878027133947, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765222962359, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8596637411679224, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8397339726616714, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8633916039863943, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998595520806, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122899509831, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6688802473193107, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7170118915597734, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8080672317353043, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787288179656, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321874156777, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8019358306896173, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7122321851964918, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.849971180124959, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321966214947, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.918480251454764, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.879146754080187, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6893056235242043, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8568122946452629, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424349958661, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850317349028, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7041601422344677, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6723316923373511, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8386797668044861, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336926323801, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715110875242, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8633915993783478, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8596637575210083, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7813306156163365, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199673143758, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367869440729, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8068526125286153, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7839884641535868, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7718435046210333, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948066694906, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366617696962, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5813031059523797, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6859494713347415, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6334102866657508, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872212203648, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191484597642, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8104789209790643, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7905303335050055, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7879312029327352, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306373117294, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680076795363, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7745833911028311, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7122321869372783, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7943849687199183, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867745232103, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577944004811973, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7106282895530206, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9252299536581488, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8104789079476099, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835399729691, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256056051992, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9066531163558337, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.914900949910652, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8799743672074604, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.867933847900626, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289387980628745, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8311430700959507, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8624675271609064, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6909762959282707, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197682503433, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918344326677, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9149009463774918, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9246876957930861, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8984105542336923, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671340489858, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.846957861903918, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9111797079901597, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8732148275546332, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8933093999036469, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346204085805, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277730797175, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7879311902977563, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7446563557966249, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7620701095376863, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094728923455, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.870597269405199, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7476159446660784, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.744656330649854, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8278281512949409, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388081724731, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548809327068, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8991213859481313, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942199651724, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8509647035934067, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933290045446, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256467042576, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9130583424997301, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9092645162255973, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9481545314558656, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583449057182, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110429286318, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8962513718040569, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9019206789963259, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9752018392230618, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325221244275, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9394706062251713, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7839884504216864, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7416740161807238, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6671476554966957, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187368171097974, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419816365004, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9309620713076447, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8872046089265752, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9130583342163257, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823429945608, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898192455685, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8679338476195566, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.874934614973366, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8895288565299746, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.917302656376672, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145807040052, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.705785038562254, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6859494713347415, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.690976298726627, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872212203648, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191484597642, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8783142471606, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8766343859358802, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8289388183932616, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339645525163, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509646942772379, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8140528099565448, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.741674012180068, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.65135487138035, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583230968471, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105895385741, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7074047132740295, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8044059197608817, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6842640180394751, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797641671305, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283821762108, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6976089195560066, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423189879089, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5621764889465547, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324853749203, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545490271877, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8895288374400885, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8661325066628802, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031738164062768, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545685168886, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359887872522, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8740772249925527, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7931059408777849, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8221891164808164, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956580918070555, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.682573725846591, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.929951039482204, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9196425325986444, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9518632317157885, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9412234417729464, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531275423865, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802298556562, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6548947415110834, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.77594454992902, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506448956073, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640117123381, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9079671354870378, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8856314771720469, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8661325140056815, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206816547469, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343843119343, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7662936592976245, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6825737319363249, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6261241815316719, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127704973883, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640372314766, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7620701039380483, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8068526187399939, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.791821064850988, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583079398934, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.785308590717537, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9019206795704309, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8255897257952309, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8019358207180847, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366638497942, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767957072811, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7325918295220321, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8244619325096256, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8879840450546763, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047242083197, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737940837754, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9086178925531849, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9525741302766334, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9073122223888967, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9390248157146736, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178960977814, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7325918257709743, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8479677517501871, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8116760118886366, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891398363839, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333245997226233, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6297746234947167, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8175744666755297, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5755879989991365, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241791049268, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947310132873, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6424324745365348, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7025300535331426, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8766343847656978, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833977077284, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367988218895, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7264256087826046, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7505527677491365, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8152324754636432, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998510639847, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306467213648, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9782188274382667, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9775429446016408, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9585377243136125, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9778834094618593, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9618217249364982, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7592254153462924, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8418256482302189, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8519527989305481, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490871927517311, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068881969489, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9407897466182288, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511454312041, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9019206768476463, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367945970041, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094794388418, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8278281467310695, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.82104410403328, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8688267776532407, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325049780306, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760205470729, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8006919934874551, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6825737135064059, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059252945334, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545604071405, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936663146408, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9059898157037424, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8509646881818725, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7994423157589936, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.757794369937867, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549436916473, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9032942119741212, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.900529786438616, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9073122174900891, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942284045855, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435012443736, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7041601368292371, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8749346171372249, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7170118806616262, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.873214824479868, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631347214152, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8832359890955733, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.903294206922691, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.806852625450856, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587907100183, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267770568588, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8670357621326211, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8244619211781185, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253765629626, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762912572429, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943720050005, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9207896836474527, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9149009629560158, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8799743785654033, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8887587940669934, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9294404007125333, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9399133519227013, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9635062335497032, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9529258214663983, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9515040000366276, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9559813457460582, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8104789046355672, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7786493246684821, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7138307698259113, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519527884431939, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578414503235, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8670357673239462, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9539660993107465, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.964051674500228, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.851952803458086, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578578989685, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9343951663101979, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9149009515375972, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.942506722490179, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9445872044921656, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9399133537106323, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187368140726836, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7341195480985401, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7892336991997223, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787106656867, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.795658114887676, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.920217984124045, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8519528118918331, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8670357540105434, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755720198526, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748628273186, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8548846375125315, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9136765188728453, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9207896784009684, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142471332122, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9190632848233077, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9566341997995166, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9766692321887286, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9730364973630523, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9858276341964741, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9572778044497858, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704648061036542, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8233283947646514, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8991213814468876, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755764924642, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511487827007, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8469578455215057, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7648916071890509, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8529354758793637, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059462377513, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430382616353, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9284087989241586, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9412234435737694, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9686195690203211, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9469902287884561, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9549844682221668, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.74613898391837, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7217432337731353, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8006919899083578, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339658537442, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528155822049, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6424324708988929, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8175744607398192, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6959583210810056, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548584660949, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585947191016, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8933094080106588, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8783142305979187, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8740772474195485, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671387464768, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210870375588, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6808786088105664, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7461390011777167, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8092759674726732, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647882589979, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891271848003, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6825737116369063, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6859494483436364, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5234203700811277, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690736879977, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786855303329, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9124361556509186, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9385759544474586, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8255897278776252, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142570193966, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9376689658259387, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6548947271774433, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6406358373455243, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506470654927, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283922446022, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802494558872, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8643104446898031, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8198933388971245, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9039745086566932, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122946173989, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354719241781, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9173026592320916, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8469578448680524, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8499711828610882, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324962784007, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8962513742372124, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9099070088876217, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9425067202733065, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531252507714, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206782207086, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391630903635, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9525741270163519, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9569571497726409, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9511422224969928, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9637799415727324, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9730364987192663, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7690802298556562, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6548947415110834, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6791787049665824, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.764891625007591, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.818736788640611, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8068526346577772, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8895288478704704, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5851011511033897, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435013239409, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673082749007, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8791467688581663, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.939913348470099, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9339146239389158, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441014257442, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.911179710258565, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6842640225341919, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5370413752405953, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6740504756030319, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544140569597, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740162262913, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8791467623974152, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8872046036861007, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8539127488101982, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671354051064, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9314625034629417, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8984105445439322, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8962513644344376, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8816149020979531, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743716773001, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933690529698, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8705972692268086, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8848377737344028, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.867933845711568, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711719731748, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864204025759553, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9304582590261464, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9105453996460834, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8670357531783839, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9224823455108814, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.849971173739275, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7341195303447043, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6976089336464758, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5409238877959542, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804246939116, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159619631508, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.762070109363773, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8418256413155819, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8068526271715756, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956580948348909, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096144233505, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9273633002422976, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8832359812692789, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.94078975076843, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631449352768, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620788404243, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8705972659691211, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.868826779604938, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8947894687548971, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9549844640516192, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872046016031, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6076631653113675, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6132365680962385, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5945512696588725, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666072853608, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737092911065, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407825893521532, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8322366512399056, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6531269122965625, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624715274982, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918200658545, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.791821070457669, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.865224082862448, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8438950932231132, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744769334159, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178979687889, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6619228553018962, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7577943688426129, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6671476640740811, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631720850904, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.823328396741704, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.741674005707792, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8998277760946713, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8548846405788475, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267118133647637, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772375855261, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8233283900081687, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8092759686626305, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8688267731062577, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849571160007, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283901794257, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.871474865182261, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7981867777425143, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7690802194715504, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388124497695, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337005183012, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6113819526829714, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423189879089, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7461389831272651, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833891863869, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215432529117, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7592254006337724, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7356416460232598, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7662936460738355, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267118007611752, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358253046601, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8278281536120313, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7981867782371049, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059204533972, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441082488722, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767874350161, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445529657953, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7371581667162184, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7025300430187068, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689552384443, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702779551985, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6723316933599375, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.779992912101405, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8031737883295293, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.684264015033114, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849598200391, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7549149861693695, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7008948024629286, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6370307812342338, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624744340344, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619272732169, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8221891354059874, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8670357524989762, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6992544287412019, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.879146768549037, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493110452771, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8198933361553478, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7122321794624925, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7704647906565738, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264255935002568, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929109701726, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8175744695213121, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354735118377, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7386690838599241, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493230143022, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867734317056, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8386797655644523, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7704647932322726, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7931059570679321, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835406377659, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388194331632, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9235923210420924, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9645892728455713, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9416541596941087, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.931959575592128, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819106172503, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8489721957015597, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8955226753555469, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9086178881508101, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314732491997, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9416541607433762, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8489722131195088, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8418256419382694, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7634837518817006, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568123026897554, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947479032303, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8407826000817606, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8633916015577366, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7676898584165354, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382149232858, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366495453611, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9130583434517889, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7931059573793923, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8568122963803879, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357640109891, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.799442321670246, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8624675277410853, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8568122886717854, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8933094015047964, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343686707331, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096133107001, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8872045929529196, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7606506428855244, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6825737625615214, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366545518692, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737983590199, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8670357516142126, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7520125667235165, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8705972750175939, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314742955437, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127471847758, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7786493003418908, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6636689379932126, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7759445450893134, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909763157433129, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324680549294, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9196425386801226, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9099070046227572, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.905322291571122, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467589027122, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338475285361, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.862467527807876, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624826962795, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8509646981081995, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.727975441550234, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765252905041, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7745833882543793, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511642601299, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7520125577967124, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762758895311, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163535268941, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6740504897641487, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8774767818352046, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7813306277003902, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281397297552, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105531102895, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6039318347536344, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423225005017, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6959583092289416, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740390784371, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884465041309, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7106282928277962, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624942845892, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6992544118880715, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352709934075, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358557510795, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8697145854999879, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9026095999763459, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9268352813534441, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942280966223, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755712283518, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.660172408501868, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7772998509816023, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7994423285670615, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241838748642, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582883872347, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8344068969669826, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8749346171372249, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7577943671213457, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068872954495, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744839945992, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7520125682270087, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8376199674932469, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7563575575912279, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884605641584, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354869524667, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7918210548061413, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.781330606280645, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8300437706032175, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493249776872, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341194975461504, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7772998514442512, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8548846336330808, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5832033761202008, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306189304199, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743634709865, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8397339735774089, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.5544704597564006, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8278281576620174, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148360941412, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336906373443, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333246012245326, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423245264594, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.789233706046437, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366592200992, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388105785853, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8652240732414608, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7981867885783474, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8140528001004292, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916052542849, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802502987679, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8221891245248204, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.679178708993387, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.752012568922284, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.764891614449644, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.680878627863011, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445497200873, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8300437589384473, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8679338503819409, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316999555341, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748549665923, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6315942980301301, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.781330606280645, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.826711791419279, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102469197724, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916301405237, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8757869956490185, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.937668967970118, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9257686357885897, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9207896702371786, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.916109619507757, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.731058591959501, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7690802159739146, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7217432142454158, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918097646994, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648915940753598, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7662936484623912, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6723317272212447, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8056322026476466, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740161721326, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.747615947642595, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.900529785435776, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.933430815484205, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8732148200173075, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8697145778273019, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382093993655, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7592254076604092, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8449215206717603, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6992544185839188, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382108532572, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8723473851377225, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8740772234918696, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8267117819424404, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7233094684587086, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527875496157, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737909275259, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8840392784983504, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8879840502496215, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8766343875827441, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032941987939921, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104597665084, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8714748649636844, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9525741251180385, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9066531272280516, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970752951191, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907194477886, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.867035749384961, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8529354710283372, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8918110429830982, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797156732045, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226845147175, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8529354711665746, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6279512270527781, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7549149919122553, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105436827756, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743410444374, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.43782351732835467, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.567936579520597, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.513668445497157, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563211032413, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688340858245, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8333245983126383, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6791786965207596, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9196425250964916, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140528186211864, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833757505655, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8499711795158419, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.766293647693152, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8723473791765216, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149904659495, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045962837422, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8519528085831298, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8757869937435394, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7592254103789328, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.766293654207279, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256563681185, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8799743678852469, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8244619312453102, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7853085947855354, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549483357046, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312003077356, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8840392937942896, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8925625247085736, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9246876931070155, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.923592318874076, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9399133543643545, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6791786943844029, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8519528039382835, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8933094043939064, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819886628806, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059223434065, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9079671384428774, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8864204176691083, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8568122961187297, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9437636524907997, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.856812295701091, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5832033754913716, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8104789210413863, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6992544188902569, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754500665844, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102887057536, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8187367944658286, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8832359886384159, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7606506589388347, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619316071566, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251136470148, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8895288397145636, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8856314778377804, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059199883069, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324946910109, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127479497977, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6388353040375117, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.702530050903841, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8799743646326336, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.830043775299069, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336967725767, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9032942110257115, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9407897521320933, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9603611610888396, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9099070071093466, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972751299309, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.877476793438074, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942166749723, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8548846379249393, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.902609608643376, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.816406387307111, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6842640489076104, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8652240777211507, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8300437768941483, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467705987729, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148169348369, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8740772317123913, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8365545554124347, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8006919956437748, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284088033225045, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358265218146, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7295197992966231, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8140528024047401, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.759225412204469, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228844526487, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872193667467, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7341195502316903, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6460136933342912, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6943026864034, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867835463208, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358250779997, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7943849501110334, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8791467684386602, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6943026721605087, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435156548983, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338528294291, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9039745104849204, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6566582919870387, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.848972191761808, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916146473914, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.767689869971839, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7154239996219869, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.78133061138868, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7074047085129536, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419718220238, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306409908679, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.920217985847415, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.894051718250195, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6876299925175163, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760207092273, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346229329366, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9722043767215953, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9796676439024322, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9529258251782441, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9840936094364057, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9612438052319562, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9012274087373773, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.839733969108671, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7138307479298062, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059219315117, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9207896726193513, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9704646617717205, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9372107891255839, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8998277777365362, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797063975491, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9425067259899915, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8568122949089845, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8092759708217394, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9449947168131332, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343848511201, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765230190173, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.827828157142657, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8152324907912836, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7279754405883195, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743582061225, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346248593359, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9339146229955986, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9314625079479102, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8311430566873738, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9105453987423614, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9489172652470024, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.73259183809239, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8723473804071734, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7416740391908838, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933348321182, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715094330758, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8006920093450042, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7057850337571814, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7446563481398046, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672146978951, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526321056185, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8872045975446038, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.743167992983927, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8519528134956715, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9367494754064644, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744829239266, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7154240000874749, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8449215246136332, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8428631544046841, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935224065919, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.737158161539073, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8354835504132216, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8449215326713939, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8116760068108716, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125612465767, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.828938823571202, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7648916141640151, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7676898511059825, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9289263331415568, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897184703667, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894698977994, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8080672137696701, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8558511596981432, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8376199712218515, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581607294369, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956580944326999, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6187804161538462, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6757645876234, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6076631672239609, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666616516466, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036087307926, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9196425301155582, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.923592321096131, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8278281461062966, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998545293205, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620709577614, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.752012583892895, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7490872426625433, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7866228396411342, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140528234273345, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460136961677142, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8624675261849243, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8499711770034911, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7310585556045907, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358292075552, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920094226181, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6706082821135491, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7839884648096995, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8386797598456718, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419768744461, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680206757746, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.848972184639786, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9118099572100893, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8633916140635856, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.767689852358099, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392896301134, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9105453966440742, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8933094022826281, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8732148328707515, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797121533751, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9246876946762773, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8606036131466427, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7295197725651605, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8128673066015064, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527977820572, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715025799391, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.934395165513882, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9173026559423506, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7969253656583157, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835393556427, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418175898172, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8596637430911822, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.798186773144639, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6774740197162639, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228263328704, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666485031821, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7620701184565218, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8056321872015815, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7490872252280348, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240832734981, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303083579718, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9918120905253734, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9929882043448154, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9895916853628929, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9890130569867187, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9793540684905896, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9252299526374369, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9124361522925742, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9477691430323033, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9111797144274065, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080729799932, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8092759814860554, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8766343861062743, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6636689544356354, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849531264174, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.89330940530103, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9304582560835113, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8976952893117837, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9032942104241829, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9184802473314904, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9507778844809432, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9433475740186437, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8940517257281821, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8459424352562713, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.896975569059444, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.871474865498067, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7074046919667367, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7799928910480228, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6206216094539297, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672025031109, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.787931195710479, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9496693675610849, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9848109505313505, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9425067191086735, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9844563536455181, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9777138148433517, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9289263290253241, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9304582549434318, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9073122140901299, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9353465078259896, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9458012727603918, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704647879687371, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7563575421619796, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8449215254995193, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299897977768, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201714931627916, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8104789083376024, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8438951153598384, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6893056258338449, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647000493682, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063751139832, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.902609600518878, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9046505339489042, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8991213737499134, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9196425328664612, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9155072406073422, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.5813030981912289, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7549150035511137, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6442251233494382, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056243677704, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059222746905, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.670608299834579, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.665410556335315, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7690802432184954, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601316095982, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740362169236, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7866228444167509, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7563575497537289, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5448013945923937, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.629774590863264, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191547112927, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8175744732409518, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8386797552091223, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8152324842686322, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210440947864227, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438950884847541, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8438950952074338, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942289119546, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9246876938643596, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825923069667, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.886420411854083, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8278281744586787, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9252299534905036, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.78133061261589, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9372107931999315, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.892562512856659, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8832359854494674, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7826624608394792, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8766343871159943, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9329437129858001, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197664197253, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7310585896520999, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8198933385255074, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7233094754123257, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637574056744, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283987397539, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.923039162806807, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9449947181641885, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9394706055825103, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8910549516292298, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9511422195210876, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7759445578121217, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7892337024874955, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8652240822108741, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215453835455, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526290208999, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7786493009129333, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7994423188513964, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8233284020484101, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210524788353, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544313892913, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.6876300074580043, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.6636689722427752, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.6959583255587982, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802552820118, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224229081351, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7704647832132573, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942289119546, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8697145790113624, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059181730787, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9224823397804269, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8300437779771404, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7969253584352353, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.5736784346862197, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548662617725, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358227263899, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7217432025578615, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8289388117988059, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7732163735511289, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127494153766, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527491387028, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.9603611597296169, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9433475766700852, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9314625051639911, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9529258247138317, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9429285990303287, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7606506621773048, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7074046815675451, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8459424388366515, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849474785464, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666577830456, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8688267718836002, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8080671984318039, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.7356416340910242, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677540012992, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825995113901, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8449215284195405, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7371581745472434, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8489722014096076, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253666239976, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.828938817443719, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8469578415239684, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7356416431536087, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8519528107178514, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714838086802, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.853912748569709, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8774767844615385, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8902942248064102, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9219218422000018, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367881609878, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528054274125, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.817574478523308, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8428631434782802, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8519528089668269, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797570762118, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970794393135, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.8652240810907516, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.8333245959287002, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.868826785879826, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.8816149028103062, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377639123038, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.7676898571929751, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.7690802466438169, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.8044059201978557, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867809911128, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423107587209, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_random_ft_llama", "target_model": "llama", "recognition_score": 0.984336350780211, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_random_ft_llama", "target_model": "human", "recognition_score": 0.9953544426489149, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_random_ft_llama", "target_model": "claude", "recognition_score": 0.9943140931843432, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_random_ft_llama", "target_model": "gpt4", "recognition_score": 0.9918120905808615, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_random_ft_llama", "target_model": "gpt35", "recognition_score": 0.9960237719141846, "ground_truth": 0}]