[{"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7826624800438606, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6959583236098693, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6859494537426923, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814819578486, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159564270473, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3123700360130557, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.24653334897033977, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5428632697170156, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073704020945, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408688653044, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.39233683783566514, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6531269133705717, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5156199214854935, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2925953002804101, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939172467077954, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8633916025640935, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9173026566374144, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8499711840021686, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321855314133, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.955319127703864, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7592253954122268, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9039745090204635, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6825737266528815, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928882063214, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240788334934, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6791786871613076, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4941408722091386, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7759445402549345, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704464784456, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315942897560466, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.26894143766464895, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.27825679159612127, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22135068154063595, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.32766828461474856, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3157359860934637, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.839733975920624, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5964331643380165, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7154239862825291, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690791579381, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445594567517, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8080672029995908, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6224593250268327, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8587185793593196, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238601116266, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105471049433, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6169358377815606, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6601723815963473, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5253688227707926, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306417524226877, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.642432481574305, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5234203490809818, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.397938419846793, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3886180315164083, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291101349116, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269676981668, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44552954274309586, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6039318449522642, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7371581416458617, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118876616306, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458944902346976, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.769080227425339, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8175744886043789, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7233094435356163, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.674050503319548, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675383439472, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8175744743173673, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7943849632887725, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8624675408311453, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357616624538, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195205105855, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7634837729633636, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7416740068605273, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7505527550496631, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008947908435282, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.764891614311252, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6976089189575122, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4843800905865266, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4902356219987511, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631542337699, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281580528062, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8548846399490533, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7563575872103317, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5506073580968776, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352818584781, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504776576369, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45326184441880313, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40168779513029335, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6206216265886475, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486735135513002, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463118907658, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5583269758972557, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5907792040610577, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.52342033202326, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676342636200234, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730756989024, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6495786196470771, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7416740082960633, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7592253921198464, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.872347384904154, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846270249788, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6334102664015294, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8278281422169573, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8322366570482993, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701166338762, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118745108075, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.750552729484582, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8499711877704922, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7879311958767313, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850606763979, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125674849298, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7074046964204974, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31573596117295794, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6297746257064519, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4282333939621549, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819755681955, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9353465162328523, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9425067182956294, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8925625214351981, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743794130794, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9329437087148429, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8539127620764361, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7853085758332186, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.849971175308549, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744882927589, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068857812976, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.37570648352560776, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5350984383262363, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7295197686789879, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215247352581, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582488128193, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8104789096595174, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5926665968788558, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7154240077051262, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493310975254, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754526003471, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6113819942833909, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5888891349349138, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3720488046690547, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792991193178756, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092208031301459, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4960938498156885, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3998116438168902, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4726834677178366, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324819759285, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.513668468742442, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.800691986669628, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8333245926471304, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6774740371736554, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850296866806, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445415052965, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9425067246778545, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9852713852128274, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8459424391303445, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9572778028833866, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9829546830255363, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3793783999697778, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31405055481968935, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1613202438807745, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561503164480185, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.25091278526050315, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.991083873103393, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9872772915468472, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9815951096189988, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9830850873326149, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9886682452838462, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7233094861450938, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7606506521051989, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6909763095990327, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531184671527, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4513265055731021, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.25982564483399373, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3040416838869656, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5888891349651573, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415824984718155, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881258909448, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6909762938378108, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6388352875193204, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5544704489417873, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.774583384971172, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740192440982, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7356416242389417, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5058591228416729, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4416730236087609, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251088003408, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381586077805, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5525396979286188, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7025300457156238, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984934051464, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3647775640938955, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4205995810279007, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44939264675355, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5253688285615972, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.28937170091825, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4804786970181734, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519859981904826, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5058591040005455, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5058591263399504, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.26133092581758594, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39606815678817087, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.36296922183451963, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4726834707160258, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3522017912118455, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4397473431930233, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.297469952322382, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.37387581744523835, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7505527582736907, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.737158141498082, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5945512417001524, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737425281707, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013928912716, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5869964139637299, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7799928887384011, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6740504829297465, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165280906342, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413698343071, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6859494571549027, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4244119986901797, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6619228703491684, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702709725467, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.737158145546666, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7401743694427351, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9019206760841466, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8840392746558846, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423193906619, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080742044734, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2766905340594306, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2281564911824796, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2267836351022643, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.1755380755990158, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364244480890956, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.36116472125724747, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3140505567025982, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.21601152263887402, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398146218422845, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2523840492368387, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7264255973677896, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7718435009742115, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.732591824203448, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8679338448639324, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.724870268535512, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9612438053017265, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9394706095830764, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9039745150185317, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9504109777084218, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9453993931705339, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.41300357163104484, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39233683178689577, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.264358366861575, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651623393200089, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594952941586836, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47657966820129966, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33285234389884877, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.28457599934199707, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.17781087671755286, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238404900105, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7772998559374357, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8386797609789831, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8749346148782909, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802704459379, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366554746238, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.36296920137276156, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.30569731452356125, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41300357241200625, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2991051896769375, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473717311818, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4863315468601629, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5563995996642788, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5389832385474603, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666096212396, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764964439102, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6636689642821801, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6976089249831737, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7662936364749058, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366069198553, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431980355893, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7956580823539043, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.45326188570627324, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47463120168760353, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593054725425, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491214185509615, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4532618373802085, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33285234389884877, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.21733751061719994, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111085830638416, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926665948149865, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46490158725606995, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31742628241721826, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6001883606031748, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.49414086883065583, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832442153363, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6531268987222613, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7634837679890842, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6688802622728608, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199060537787, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527949232548, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746407374805, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6548947119869022, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6224593341678362, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883695599152, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.699254403806067, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8740772414388963, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8624675424129965, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49218814127063815, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.842863145034441, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389943508617, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4263215955662986, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43974735321775893, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5097644011653526, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224575737394, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3629691954991978, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9750122045057596, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9848109511846944, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.941654160624145, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9876638982887094, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9702399058075122, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8624675321113088, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8092759881708518, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7634837743214091, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059514629892, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.581303090932002, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5755880258844566, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33633107682619645, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5525397242350314, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318222316394, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014736612561033, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46295857737122, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6187804394209121, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4016877911418774, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331543905594578, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.76768984601137, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8198933368889688, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.847967751649846, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9207896826442733, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762976696393, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504750976509, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2107662994415278, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3451052905606313, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.11279540206956574, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.32766830860730384, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.13117322627382844, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5717666021883784, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.74017437538007, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.700894804163418, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321815127512, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089018424221, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8152324840622539, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8469578489658729, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5058591064752147, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094666899494, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338408906736, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7799928851640788, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8092759722143674, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7826624874312912, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033593901682, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647155496741, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224278409312, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3647775609944559, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4416730095497582, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782348940147675, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074559694371317, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7931059504830892, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8824278610505644, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.879974374486239, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825871120889, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354672575274, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8606036191353237, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8895288435691746, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9385759602942817, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.891054949376759, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206680567167, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6242935335493741, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5926666016422122, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5350984316321235, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3960681760031827, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789103555892, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5888891533595246, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264256057838387, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6976089073841284, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814624853073, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174942747051, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7772998556915275, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.76348376592697, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8104789282311693, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.616935801845815, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117166001474108, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7577943617467855, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5660185373042583, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.455198616284932, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711571030003, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939263799375484, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8233284025442562, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7759445603403937, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.767689861976809, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437616602837, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.710628327225141, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8984105599041265, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8824278808736785, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7264256201394861, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461390147340775, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744634624791, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6242935576539748, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6876299789923171, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6548947118775635, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238521972617, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762728653767, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5774953752983004, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7577943832590324, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.665410528127317, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947162479367, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089118084952, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8080672017405577, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4726834573317292, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6334102848939791, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737270392153, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491215185355054, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6495786130328791, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.864310461510886, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056217716708, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494765673496, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689491099591, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7931059434721442, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8104789202359395, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4186969157015194, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702766033023, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689462588731, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.43398148638035866, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.566018536199451, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4378234903601384, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.36840571601476485, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082941360451, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.39420094425948876, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4804786614897696, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5156199168834004, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852882028216354, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291234023059, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4629586068557974, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7866228083102375, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6671476740648099, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647117190601, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548529705826, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.375706481298547, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.24653332469985806, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.45519858143745173, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746028766032575, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939174478774325, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8705972757128237, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8661325183921099, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.804405912271547, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.590779198554942, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424454200262, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3849121357949794, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3775406740844345, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6671476923684855, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291154772159, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421497515691214, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7648916196124672, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5774953475567498, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6791786759849593, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585859803275, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563503178981, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7505527707175234, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8910549659096474, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8044059186556966, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990663525038, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891442384244, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45326183359098177, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.29583988503531067, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2720245705270893, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834744343135, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582543705494, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8333245868195888, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8991213819823701, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8469578547092471, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281592173944, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306339285885, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.26133092170173977, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5698526567189076, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38491213766517896, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748899810226, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234957892148, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6992544111224274, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7994423173914462, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6671476644901679, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786302792386, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089157692178, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.33285231004455257, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3293917186658212, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30239107072308136, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792990166976075, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048022153008433, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8056321838479261, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9420819116033985, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8438951018950036, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743519998933, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253679457239, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.366589753465511, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5506073416927318, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.373875812860056, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016878005171424, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015355072165, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156199476177241, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5907792124125995, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4960938392677033, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368379225564, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.535098425984838, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6187804407044656, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7401743580573213, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4513264968941965, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073662217941464, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6460136958117504, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5214711729325827, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6992544103607093, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300336258355, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.46490157419596784, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9207896793411078, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8774767884987064, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8732148241716594, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256011775572, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867768653529, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5774953669366786, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6150878605020975, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5506073794723094, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819813896799, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531297289542, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8774767749060796, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.853912755116825, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8714748541617344, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.891054941564599, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.815232489568586, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8984105616098284, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.889528846921929, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8918110391420035, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9556514186109032, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754617205553, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.33458944247486705, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.49609382927518103, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.16132023549248342, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590151747639316, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692334999966, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40733339941245306, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3793783926725953, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3886180318975931, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.14608725144363557, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331358697228, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6460136956042739, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3720487991804501, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2974699505735753, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755879902538642, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852883285136105, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9629528317876613, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.972830766697249, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9755769095253004, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473735739139, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9458012708355393, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5851011601907297, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7446563499028042, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4111108638982229, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.46490156205519223, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786971067583, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5486734785934303, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6460136886825746, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5563995811685664, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292634124784898, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681718058952, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224629847463, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.685949478548458, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7008948206456109, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.689305621332814, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019530969811652, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.24508500454695087, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.324235407960152, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3867634342459873, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.18242552499420328, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245759839125, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8955226730195686, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9543079692711144, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.903294205488464, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619430347231, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9485372340420334, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9263037299960206, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9376689634314501, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9309620690243424, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849858120705, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9420819117603606, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.28298812258621137, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40356686837606914, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.28457600560217144, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061737868923, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3998116720310996, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.48242911740349015, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5370413995629947, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7106283035625489, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.712232185894347, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583228016218, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9473810445469902, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9289263302341336, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9173026523884318, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473845585419, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767868463442, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7356416242869028, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5058591228416729, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5602526632950907, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251088003408, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953704976714, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8661325102245544, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9385759598721801, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7704648112674795, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031738004619943, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338572352203, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6566582398871664, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8344068776533337, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6943026708335088, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880056841939, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312110941936, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49218812700343073, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.41869693145189424, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6808786103182487, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585889127239, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321893224353, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.1460872488431323, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.355774876325165, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1778108715356952, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.26588046824777195, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2450850144152416, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6740504877760902, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4436004228599944, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583270194905364, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011581341959, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269956907243, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7138307659223382, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43206338885726414, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365638178244, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902356155419262, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593421029813, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4455295344027635, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7090191562644677, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9390248169619497, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217431875089326, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419959530709, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8740772240466564, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5602526731696587, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8164063704068482, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.824461938452342, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8438950956728132, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.883235980070262, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9118099525231589, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8596637292894431, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.879974374852613, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620694474652, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4863315417672945, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7520125530718241, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6774740196294036, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794003993107116, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324807520356, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2509127802554809, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.34334174038815884, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9005297873381393, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092208094321286, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974733962864876, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9603611576454523, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9529258210919707, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9697854091108867, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9832145095479888, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9469902275471954, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.967410255597151, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9658995716964459, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9566342029542336, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9702399073005007, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9241418232598039, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5195213336553703, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4532618738070049, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7431679905467576, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988697246457, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381411538927, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224349790896, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4225046153441557, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5964331083629827, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061497800414, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.372048784870183, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.651354853503107, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4804786786430314, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4863315443133089, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878529584155, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939263524698014, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5964331272667813, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264256057838387, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3812195755421629, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814624853073, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174942747051, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7170118633231248, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7201715204231433, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7577943670751867, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197715331829, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.626124146851928, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156198943302435, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4590761206691403, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.466845589836271, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203510328092, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268344446261773, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.877476793501779, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8856314834869042, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7295197686188357, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489722075480316, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178917934725, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5428632616520067, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35398630973162715, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.36840571082947365, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.692641988760252, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420094923913734, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.894051711914072, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9546474191465468, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9609517091516637, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519527906708712, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549426464657, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7866228411453441, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.915507253381036, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7662936491395652, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011681628548, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624614833266, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.31912139536256556, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3647775602484233, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5370413893349598, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074558783756106, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.50195312985798, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5058590979748412, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4649015776412408, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583269764596195, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631631420428, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.602061581244034, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7279754415775108, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7310585681821838, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7620701098203688, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430347344136, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939170404905027, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7994423239313978, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8539127556956507, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7918210639022689, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423238096546, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116759959046751, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3557748741093949, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.36840571267098343, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6352224187191478, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241638455859, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.35220178031615645, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9130583529394064, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6808786049049398, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7606506450594214, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762984442216, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737381526146, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7401743555825927, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7386690839260779, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7563575648600052, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648915945079199, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891417818247, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4649015878781076, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4863315639412708, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6619228591835058, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.394200984274224, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3380771391054751, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6334102576388014, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6976089249831737, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7476159606762239, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366069198553, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118643854787, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6150878472230316, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7718435006458401, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583269920476347, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321790754574, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947404990517, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5039061477685471, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6406358620725678, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6169358141820144, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2814056069752373, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056063479408, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8791467650335109, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8679338446815507, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8449215422657805, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228286998724, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096146646084, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7662936410216838, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.622459338453575, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6566582697916632, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640118021958, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137165249242, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3451052586898561, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3757064774031961, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.33458943632987076, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.10374863125118207, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233680811219396, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6388352760410259, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7185943926197932, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4073334001020431, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082836515499, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026746112944, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7994423217390512, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8386797595629053, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8044059048025933, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744839222895, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891452554461, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.644225104206278, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6548947119869022, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.40356687700122873, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092207756614303, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463118758959333, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6057990561516404, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5253688018557895, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3522017693415112, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195324143072, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.45907614189393997, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46295858054593847, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4244119972765612, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4111108615289588, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2568320037938544, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358469119036, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5019531192010069, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5097644103608424, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4359015326522908, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953803765911, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526577544127, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6206216105579319, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8187367917871489, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6315943116836241, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365594992093, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256104576267, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.29098087480829693, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.23651623674273428, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4804786641225023, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512418978784, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.590779199356892, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6388352782290175, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.32594953168386587, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3345894490107357, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030845576851, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293917130714979, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8386797695226784, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6076631680421039, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085767596004, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085754451461, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575534742331, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8991213772643679, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9669140197209528, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9742394390735545, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316794699115, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9588471153359377, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40168780963612416, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.49023560608636935, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47073661070080286, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.30239108968260303, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633155074101037, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7879312166312425, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8962513779271422, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8705972666385902, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.94292859785357, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.941654161837077, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9711290923322989, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9224823407102235, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9653811597652765, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9711290919457042, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105506622285, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.660172379683066, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7217431921063231, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5907791893229283, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073334241290999, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463119611922977, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5602526565451902, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8732148244867382, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6774740077883519, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256100313362, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802587325525, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8152324933812681, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7606506461820925, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8688267737241849, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.786622807633102, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9572778004047406, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8558511418789303, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6859494481363542, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8244619167891059, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936346538567, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099575759397, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7534666622031627, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6334102584764582, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7248702830303926, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891510649753, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.598312211181473, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45132651119047884, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4804787166408086, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.476579638415068, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984426144676, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.646013707476975, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.33458946042358656, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5097643752582364, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6619228610994281, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690954061514, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.45326184461037555, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746324587166, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264256167034482, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5698526363860262, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365663056788, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620700978731153, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.796925376634716, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4436004198867468, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416730262943126, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814809361712, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4513265112722813, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.47657964467355374, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.581303074957727, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398146381324954, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030837064452, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7505527520985947, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8300437554512351, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7025300693902956, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253708195551, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311983374935, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4282333983041189, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5019531090941056, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.45713669478171387, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755694653524, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4148988191000809, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5214711489073918, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5660185330695426, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4590761139001957, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033560312686, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.75491498868734, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8044059247762118, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7772998789955285, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8255897178387509, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085745854097, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646000847041, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.36477756738939776, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.46684561816862635, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984590459709, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995735191206, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984176827261, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5794004088451795, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40544872861165604, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5019531173873106, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3140505607327464, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4474602793645577, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.633410249337533, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8322366577146243, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8428631477607, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918295119757, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431679815422378, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8895288508552842, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7620700933803629, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7431680006473016, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388096937337, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445495957356, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5774953598992524, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5583269950762145, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5019531222803097, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786909723143, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511488356517, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5755880265423945, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6706082988864042, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7356416486804651, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688392576717, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191340234873, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7662936550650746, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264256072442657, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7371581548694267, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740169360759, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825969704508, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.61323653703255, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7505527689082522, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7041601337675601, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935308770107, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008947998883248, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8558511473340944, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7520125596557115, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.759225402772641, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757646077938881, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191308257792, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8031737993769021, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4863315333180506, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8732148373638796, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281586711622, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423210609213, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.879146757885039, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8840392769544735, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9026096022422856, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354821414569, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338454339555, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.817574479782837, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7772998645929902, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7905303186854009, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545622449481, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283012970926, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.426321588930789, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5869964297671043, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.544801410046245, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737176760097, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704660028826, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7799929021083539, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8140527893166654, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8732148376212914, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.957596171301754, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504776361447, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.41679665768546903, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.41489883739761735, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.35577488691287484, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551986070760327, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730843410669, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9246877056942019, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8449215306809349, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8152324966700596, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9039745175726553, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680085673164, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8998277822199467, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.880797071246672, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8558511560095522, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.969324197672491, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772334524879, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46684559290506733, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6039318402036791, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4035668592820111, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907612859731833, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238620458844, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.554470475891967, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8529354866364739, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7325918483983406, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122989277858, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432138013514, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4921881175086938, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5234203578008747, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1883239877567054, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218813856779137, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.30404168078630023, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5253688323327573, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4785288352939764, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6224593332245478, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.687630001018022, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878485475718, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7401743579981992, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7074047112062498, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47852884546799196, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711721849592, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365388859021, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9666631755894173, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9453993904709009, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8918110422733159, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9750122041595997, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9507778827549024, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7732163776048687, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9224823430183723, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7866228335023473, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089140572374, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228706100274, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.48242911815712636, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.45713671027140845, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3738758178204244, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.30239108179711366, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.426321585485743, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5058591223082078, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.42059958439803896, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2974699502192985, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864513081022525, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.41111087216508024, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5945512670095756, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5964331661682182, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7217432115780285, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581005141043, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7956580834631298, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6706082629151799, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8697145816218488, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7704648018713159, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.622459332274445, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740383835283, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44360043504510066, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5312093770940822, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.674050475791573, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740170780167, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852883246856465, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.38676344462693785, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7866228313762611, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.685949460291597, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197884590434, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256535542876, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6187804364988749, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3468730894690243, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.34510529582330396, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678215673846, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.552539722400367, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9155072454886555, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.793105956460054, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9334308104133651, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.888758782252952, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797527884713, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3106943902209993, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.18952109409723517, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1655931228442091, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.10302442983651251, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.20307462332715276, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45907613011481907, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5907791732977763, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8499711840069227, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241465986849, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185744387678, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4843800855371561, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.724870289105736, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5350984173996572, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030899352593, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047140643688, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8300437621144402, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7549149973402488, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7295198106863882, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506457919355, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876300110954751, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5813030972223644, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6370307886624755, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3979383813939741, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213024318792, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743497280382, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832042814778, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4668456231058671, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.373875829686106, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008947872287672, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964524651717, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7106282983109209, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4397473515638782, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.26284183261201316, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704623022423, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336971139406, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8031737852018652, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.567936617914399, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6315942807738325, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531277352541, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159579363678, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.26284185487813594, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40356685425685945, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3849121479303396, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064941609507, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.424411984090001, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3720487918760216, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5888891551363369, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.304041687000775, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.29421496158074195, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220563457339458, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7074047266289274, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544219881824, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6095241529393238, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206215940810794, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.705785023034469, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4941408832961863, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6825737302937722, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5486734966207129, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4532618571749703, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419917639913, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6370308016680633, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5851011786479922, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6442251249858555, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106283055463943, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527574160825, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9086179015654157, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9012274151012102, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8164063864429724, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.891811048094067, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.868826784161139, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.635222402258335, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7310585894199005, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7185943881304248, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321845642205, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.33111976214175687, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6206216118621897, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3904758259886832, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5660185036829084, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601330434447, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052899781039, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.32766829349580473, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.23091975390370637, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.37204877750827936, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.13846179855039226, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633154204734946, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6893056156424054, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.680878597001079, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5964331466996262, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804433603703, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431925374794, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45519861117665333, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6039318449522642, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7431680024324905, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581496901285, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2643583591711592, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6424324893115613, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7813306358329147, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8244619310195587, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935201601026, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216219370042, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8714748642849663, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8407825963076522, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7248702953000389, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437592569301, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121888608091, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9284087978948319, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8962513761375651, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9626731132197377, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9059898180902066, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9563089383607125, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5019531208894601, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6039318466751722, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46684562768003485, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358315997173, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764808054528, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8438950847097865, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7008948043711314, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7201715119384242, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802599044696, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797568603712, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.513668445849296, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33633107682619645, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4244120012231932, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299864673244, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366047712672, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7310585749520478, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3311197422140125, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41869694353578607, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761334260426, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990306407462, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.43398145944771005, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5945512732630472, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.40168781823972094, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39420094865557553, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3056973139374586, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746247480962, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5983121905459748, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3504213669643475, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832186106397, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819787653125, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.786622841866822, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.83004375970432, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8344068845018432, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336874782735, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916142987833, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3942009352435563, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5679366144131038, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984641819161, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933424088231, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392876212354, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6548947396420793, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5926665953691095, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8031737980566391, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.707404707592424, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673244470593, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8679338551531518, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8872046027257491, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8469578450696967, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527907871982, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274069292373, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5832033331362211, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8807970736949983, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7217431967203942, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920236921314, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.809275974434675, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.37570647958528275, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.602061563588715, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939171825049085, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8679338535912701, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8006920005682947, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.778649314206809, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527706079669, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297918762731, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4610167908389993, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5214711696824554, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6442251203310023, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023564003586995, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389927316707, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8407825956026151, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6909762854791954, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6315942835647116, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786265849909, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370307864285156, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6825737398349994, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5583269959216428, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7041601361296825, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358487638103, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163671691525, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6791786943186894, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5506073901336451, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370308174846404, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.36477757490853996, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175068919355, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.573678418234377, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6406358589828607, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.585101160880917, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092207894088666, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.64422511382926, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4359015320016275, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4746311785447936, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.33458944721568973, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047870301841716, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.647798220664922, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3979384155958009, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4111108558169905, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4513265066795419, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165275593135, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866939740350377, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.39233684067959823, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.297469964812232, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.290980865225628, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436004318417326, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3140505602863804, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2877678020026092, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.34334174038815884, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4016878049566989, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3293917185944875, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121591413974, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6706082868706562, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8714748709956811, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9012274177461065, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943922650639, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8714748649901233, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2351083868602412, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3398276281418915, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.33111974445052256, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291191846681, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.488283393997984, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6808786133978749, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5312093735416088, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.871474873454145, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998603917806, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797774090514, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.828938818811215, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7786493108111853, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7620700960749472, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.718594382394825, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9381240106979762, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7386690719819587, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7185943890921105, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9136765142303402, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849760304735, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089159274322, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.19930800671758558, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31573597271908443, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30239108281174865, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.33458944070238444, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073580142472447, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7041601403879441, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8577680997698959, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46490156615559114, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740063426387, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163802039352, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45907612840064577, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7772998481716182, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6242935311882923, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666038404532, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641499150336, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.41300361277223974, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5019531361834229, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6169358157248745, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754637821072, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990342452497, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.39233684146539954, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3849121690589594, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.29746995642080276, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995909800078, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39793841281653863, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5097643675317088, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7008948146768194, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4493926357106675, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526374469057, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512628254352, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3040416811902451, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.45907614145914105, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3775406737184897, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2845760082491372, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995966241614, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6636689553645073, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8661325069227718, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8749346149901571, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700976325481, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104440183232, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2909808791806908, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.46879063151245554, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43974732574252906, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415825271080846, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894171466441, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.674050498633127, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8092759608282282, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056110175022, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624776987032, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545542036188, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6706082862682843, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5907791940594826, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5525397078689046, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647060763671, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125546184377, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8577681134767122, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9059898176425055, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8221891285138498, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437722658047, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846398986808, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.789233697738836, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.806852625997292, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.24944723041256245, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928924180032, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690686586634, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6531269023080469, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6206216306371997, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6261241773652058, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.590779205890259, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004099622257, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5175708845726932, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.515619903644525, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3451052826126325, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658974027702423, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47073661344644957, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9299510394867685, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9324533094674862, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.93534650842111, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489722041567058, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9449947159339603, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3259495164837357, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7279754551584944, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3522017533451981, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756753528841995, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251189469784, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6206216216491233, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7446563292803577, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6671476885816351, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581655468086, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7918210711827739, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.15507847163067212, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4359015109617741, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3007455876640428, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180226854101, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.16559311609591573, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7759445522742843, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.712232154457573, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365555327037, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.874077237323982, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.684264055485556, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7122322182846276, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6909762990991126, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7401743650107084, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413765239918, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137231058051, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6636689474642831, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6297746125539309, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5983121807419655, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251046273353, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591087200748, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6169358192798742, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5544704794759533, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6095241624806084, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082934579831, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47657966445274413, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7786493213979692, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.727975451204212, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7416740158634497, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585754345508, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388139180642, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6334102633568264, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5736784119275061, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7943849608644926, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307424368586, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624813694152, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8438951027270616, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8548846454231995, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7534666637879068, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477981970477815, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321756088575, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419910579176, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6757645940455718, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7892337076436403, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948227608777, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089152340702, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8499711868717872, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.787931187764403, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490872094937201, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047141091685, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.684264032933735, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7201715062872945, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8056321884529962, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7201715107487061, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850379473359, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423406284016, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3923368340961594, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4804786777837685, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7416740129018028, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849509190516, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.658417494206248, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.39233682383483287, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6513548398923157, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5448013894593151, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102801385079, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.687629997192465, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5078118714128428, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39606817073498907, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.23231014752915413, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510838109867457, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573597571558254, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.36658975420532247, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5832033696199066, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7154239802703339, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.602061584092241, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213160613905, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7549149807542331, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8092759794669029, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6566582513149798, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316920014661, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677538465838, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3486451213106828, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6424324999630452, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5039061609627274, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.41869691765186995, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990409416316, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.30735801828884246, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5019531064835805, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43590151876398897, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.42250462504470054, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416729863206099, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8031738162161298, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8449215286839127, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7969253715401339, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213144300074, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947260169896, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5117165916593871, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4707366329582738, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085985335537, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666458490579, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127509977928, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.37204881064286, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5544704235293896, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.585101155754032, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3904758181002578, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4687906124264564, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3208213130042918, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2351083834627991, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22270015590042785, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.366589738124945, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.25238403663954523, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.383064164263366, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6039317903508106, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.37204877047553625, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259816089462, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2782567744422852, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7505527620044432, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7577943826138496, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6206216067250803, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140528014560681, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063681173034, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8783142513120777, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5039061617372579, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6943026840148712, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195359512304, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337114275656, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5525397004928516, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.581303072114578, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6943026853972687, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.496093817950555, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837612289375, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3960681682814498, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4960938440934134, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3398276104776513, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40356683967772294, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014732655415433, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.35577487626390514, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6548947255076377, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2991051953855508, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.69097629281155, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256009104038, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8056321821791519, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6706082570662372, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7549149816365617, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640209516605, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239698523471, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9618217254742013, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9828232909588704, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9722043756612788, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9329437135877893, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9761291658004313, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3504213747121807, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3157359895167925, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30902370370380866, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633880946033, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.16776335293379147, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.668880257124283, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9372107932973526, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7918210828317744, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122072283638, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737352012181, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5983121948463744, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8128673214260324, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9124361566916699, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512176378087, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990334461544, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.33458943823711595, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7799929097959505, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5851011739213099, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4282333910731015, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8175744729663924, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5525397298016097, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5888891463402823, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834799376056, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740236388469, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3998116693816212, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5602526516450302, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.651354889064768, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981166822046954, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590761009893018, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6909763006229638, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9372107932973526, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8244619325874143, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.675764609740074, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631531127113, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8714748627889556, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9105453867149208, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8056321760047789, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704648005143188, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215271309521, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6150878473321172, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7008948043711314, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6774740018169143, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581571462054, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445624960299, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4186969347060041, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.507811873930447, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2829880861154508, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.334589456114619, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3942009671988078, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.756357545173748, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7745833922499235, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8116760102307696, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.811676011586666, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318460725225, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3960681569907911, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35577487609862635, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.411110850170867, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.48828338646580677, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.562176509582252, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6442251259196495, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6584175157792587, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5156199158841538, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736783740885405, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689289557539, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5602526672499936, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.25386100738003325, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5039061801029957, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.579400422725653, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360042747871614, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7704647960648272, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7905303030020222, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5078118760268298, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216295268918, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270176613591, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7446563500727092, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8740772292691302, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.904650538097271, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737880303172, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9099070005328045, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8080672077080304, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7905303152953242, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8092759559136974, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473775475473, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928899829437, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7606506480689189, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6926419817249898, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.769080246444734, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093999582574, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744766465768, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4513265290524405, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7233094672989527, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38676342443013245, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.428233383180184, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494553321163, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8056321813613017, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.775944532363223, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5717666021826346, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303347748039, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122897731576, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6976089054287113, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6020616165506334, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7577943614404246, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982073931148, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711763977544, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746132520717, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6297746326203403, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5253688129506983, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784048721006, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734888031038, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5888891288364545, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4882833877309575, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5983121864592176, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468793877579, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367248219335, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4035668714304259, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3398276232924946, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4474602944443103, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064889739172, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881262792535, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.16885694386199085, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.23934936497666692, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.15713684564933417, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.09534946318560363, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.1721718345202852, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49609383190179773, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.1460872474297755, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.31742629065836, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2766905200642931, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3276683000004646, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6261241619160549, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7620701114809708, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5794004212719763, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8267117975996012, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.646013710309008, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9492946371209527, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8864204122406277, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8418256384069371, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346203526334, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833869303839, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9092645126059627, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.836554567981928, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8221891296954763, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8438950996766351, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9230391603355538, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.821044097504036, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8031737976933595, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5058590792133977, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307831728205, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274109487416, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5467381569765468, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7520125621505419, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7008948162553073, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.675764600009056, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593197634181, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7416740338498974, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.38306416533166865, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7676898446238587, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563385291404, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398626562132735, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8887587915182417, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8895288435691746, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8714748593168264, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9202179928267389, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377769473841, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4035668240044204, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7295197851157519, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.468790620180123, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309209927706, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.538983229438148, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7446563478901788, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.75779436501789, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8428631457673239, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923216276045, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837576400942, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7490872126889773, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8187367944558895, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8824278652846461, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998580136417, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767866358616, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7476159594224365, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6601723701950086, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9059898163375255, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.762070106542725, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528120532864, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5945512654566221, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6477982102785386, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8006919905398713, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762907181151, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324790143595, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746037653363, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5214711696824554, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.35577487184293854, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.32594952752421635, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125657070268, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7520125835160802, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.801935826058857, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8519528091178927, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684566444765, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506379776975, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7416740255357404, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264256093171689, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490872194501849, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493198668732, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646072976036, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9329437134166205, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8233283919460376, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8344068888036619, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8386797728049739, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9235923207216874, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3647775724171881, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6315942773151603, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4941408978767955, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878385125172, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307393954173, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9178933676839637, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8732148249386495, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6495786137319323, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206713123739, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354709457317, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8354835379198609, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7676898572181218, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.822189125859793, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388111001252, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.881614904171761, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5097643632856097, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6619228762306072, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7122321913052144, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389890212322, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241714274339, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156199203230216, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4687906412670854, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5350984572597292, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228300006078, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167398148019, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.48047867912210707, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6740504990343678, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3775406485222532, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238572569612, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764916804648, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7279754404273774, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7279754152661712, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7786492985088621, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585862730876, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213809089692, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7106283090920921, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6943026826695896, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7549149718646229, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631404731538, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646119360077, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.34158250234510734, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3023910851541653, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.583203340361444, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667161148342003, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646165234182, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.20434190513633194, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3293917113323002, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.09467770045247484, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223189074914727, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.07423136303069539, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6279512127994912, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46490157228888185, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093730954065, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544140350911, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7799929103797936, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.857768111211077, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8714748627954367, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358272894703, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240742774574, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.26588046725717707, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.21469141468353423, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4921881401150388, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526690885352, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.390475820904915, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6057990404342009, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7690802401704377, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7905303138671457, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759803365231, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059569379463, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6791786843715852, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5964331220673174, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4804786749042824, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590152219825534, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398629268292225, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5621764978313039, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442251136102972, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39606816499392233, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982246542099, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244119896328225, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7476159756097989, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8976953011151165, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6076631645820354, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8774767846921762, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506499835545, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8832359888875235, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9309620701016416, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9167080751887885, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545661564254, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080691266108, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8428631468970341, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8670357601437937, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.786622823756387, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389992563889, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528074937652, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9324533060391875, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8438950950949519, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8872045910496416, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.929440401350313, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9485372347435607, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6757646204694455, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8856314805606996, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7386690657527055, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.815232482118237, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681122865717, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7295197682532967, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7704647908096013, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6095241642619952, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307764629133, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.660172373846159, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4726834717192276, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5195213390873226, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4225046254076408, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165307813538, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165349407138, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832552490532, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5039061913175511, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6388352806535044, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061878606854, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878499446432, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4130035712385155, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.700894803703504, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583269831987052, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746147257794, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666531211265, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.869714567653406, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8519528163329866, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.838679760675639, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367849558245, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118733476408, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7994423071095973, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7892337001658731, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6619228691389665, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902356091718107, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397030309442, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7122321943549021, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6187804225242897, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.33633104922310214, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519860989187927, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3998116525532913, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7718435025541922, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7074046846272222, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49414089684161616, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665974385856, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191383642155, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.778649318653198, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358067529694, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7549150001151904, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740083756797, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760046921095, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5602526798408313, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6513548556200727, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.62795120383207, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643815707027, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786290320749, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3276682806599455, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.27669054821190914, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.265880486403237, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245315319592, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544244148713, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8031737983069251, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8998277788841998, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5156199136788976, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.646013695479487, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388172151977, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8832359894998646, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8140528087887676, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8438950959350878, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919876660143, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311946644342, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9759464473266968, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9676556691332985, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9492946355121061, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9844563515276264, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9645892685782658, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4205995873542133, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4804786614897696, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5506073485892655, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544871063727667, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4455295284380832, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7853085597852544, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8221891255192474, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39420095967887037, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.750552771815968, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789071402, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.762070102751531, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6242935188839067, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.42250461595570976, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956580867298828, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269220139196, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6688802411930975, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8267117795530055, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7563575592525068, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701151719118, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947418291441, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7879311903603268, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6706082835114443, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7892337127487594, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159563189576, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283867009791, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5448013894805833, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43206335860236733, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4016878025381147, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883334737115, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995859648595, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5544704714826553, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5621765017667668, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5292634012474978, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093841065565, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5078118533405027, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6460136993282004, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6774740335321204, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.585101162983357, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366504341118, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4167966484115999, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.49804689916862455, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32082130871791986, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798284965100035, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984250319213, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9518632275912445, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7981867756982176, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8832359852796579, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278633040316, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.747615972044442, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7041601605392052, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.626124188462486, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8469578551786636, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581190566292, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197863987956, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7431680099270155, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7981867696674998, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.665410564047284, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.871474858817063, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891385778403, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9626731106110601, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8947894649841757, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8955226819373203, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199587311407, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8848377771349991, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4941408970899217, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5563995789166003, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32082131962419186, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823342406445714, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.25683200637107795, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5331544000333022, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.46684556844506964, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6315943218604886, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689400469394, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632655774812, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156199200287036, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5945512748977216, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4726834820919486, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366462531708, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324587269887, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6242935114435831, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2798284860754881, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6388352970158586, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168781922109864, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381676351472, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6876299976387322, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544193828822, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6187804253389115, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942959678295, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.461016781844217, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.34334170369689304, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7185943796028182, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6513548570729057, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758128833074, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365559430626, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.756357545494565, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7969253657428359, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8864204082201407, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441007831838, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867834326746, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746087341418, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6020615882382934, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4590761128921553, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680058782082, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645936422912, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3398275919387459, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4687906474206037, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.503906172211802, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621764998776021, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136685201388794, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9358173530522954, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8606036139202485, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9343951555299287, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9489172647187315, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637440195597, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3849121656850554, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4882833877309575, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5389832131496108, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786819547647, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43590152472798127, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8947894614213892, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.833324596749181, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7170118845141356, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094107041825, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122182336849, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7341195324581159, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8092759762684761, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6825737502731213, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278643043684, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105459568318, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7879311959222479, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8816149046984106, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.672331691412088, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318472594271, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723316829925722, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45907613077574194, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39793841867486557, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6513548473728674, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331544014735151, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4902356067561356, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5755879938267117, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7106283020699848, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6334102567701786, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918232076444, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241843509858, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5195213419573196, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8624675287575903, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7732163703955571, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195273740424, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964259868125, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6757645823944063, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6477982149323438, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6740504949478618, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.786622825052274, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014736000668463, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7386690663567749, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5945512785893795, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6757645749625611, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082972783303, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723745392921, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5640984671369975, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4882834035271962, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4493926241990568, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118760150718, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740389130522, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6370307995420827, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6406358593583386, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.40544871288204065, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.27202456108842726, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32423538753303965, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5621765081382718, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7057850267305619, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6297745796092761, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318458365444, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943654008922, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.550607367643706, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4111108590633501, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6001883483003199, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935256260211, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213349563031, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40922079444453946, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6187804320225742, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.37022537411309453, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228268376089, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756751522148383, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6566582606129491, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6150878307028472, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5945512557611725, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370308209814275, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167301527242186, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8116760257842258, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8824278636843826, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7981867841816128, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297745949933627, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441106809225, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5679366234911423, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.624293521276851, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224374483555, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6808786397524628, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8757869941765256, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7879311995050051, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787009009027, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423171746813, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7520125703485708, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6566582573696736, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7154239938741507, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.867933845035676, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.760650649772715, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6187804243285963, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8289388170699148, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8824278638284292, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.839733966162379, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681044960878, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7341195257068025, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7943849588021941, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7446563562966597, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672079296534, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307443832483, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832120364619, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.679178679731972, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6206215994747295, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321907377581, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228611399486, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3415825010840675, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40168780367751367, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1530421537435281, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.13568954625100066, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32252600067132214, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7041601231872658, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7461389952204108, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6992544157211685, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.618780439044715, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880126348951, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3757064669046606, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4282333794708553, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3979383976481694, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406854616857, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.49023563115844865, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4130035985148658, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4668455827594414, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4301473544038717, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941408829702089, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688236101124, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7233094540928582, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7233094715174426, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8080672370199651, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7446563241262506, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354923108887, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.844921525746041, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6566582573696736, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6619228846593642, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.767689844781237, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673229107123, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7416740097270214, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5583269959216428, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6242935290966434, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4960938204522877, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233284108339963, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9481545294638949, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.959762055033955, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9362850054731132, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9532750407420345, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9314625039447589, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8962513713479172, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8479677445753857, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8322366517902106, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9032942092126515, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.918480250479454, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4054487367671542, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.36840569043344296, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.41679663956816143, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.649578624526353, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064664150621, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8128673145903906, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9246876905357347, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7310585788912785, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9319595758947611, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104580603748, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8918110498697421, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9289263260661338, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9219218288379698, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.97068776842728, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096157240943, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4571367083247216, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4378235012605507, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.24798744392901784, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4186969040087063, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.49609384303953835, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5019531193098462, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5983122030693047, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6654105740612449, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581491139845, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762941709943, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8925625269878353, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.865224076677395, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8568122945119732, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872045961718346, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.764891620841675, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.1980641775302838, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2200070949992841, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3575675189907932, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128142415681214, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405546008935515, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6825737232772373, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7853085857243771, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.27982850725882236, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548438103546, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489721972960058, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45907611827568395, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5983121923194171, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4016878120450134, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551986295852928, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011569708775, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8092759817704586, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9149009628059532, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8255897283846286, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666085059777, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9224823444425385, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4301473702028717, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4746311541679514, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32082131331787084, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4785288286471344, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.25091276674667645, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.626124179294219, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.48047867665347505, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4130035752882671, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711637050427, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233683011387743, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.35042136348458586, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3276682916310484, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5448013969518276, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679666699346973, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073516325741, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2643583584570233, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3040416886430727, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.18594720337286036, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193279985238595, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720487627772953, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7090191501294807, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5058591219705171, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7008948106152225, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354754891441, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759795670901, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8705972746550873, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264255914175192, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6825737442077102, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283836847269, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059348325801, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8714748638029537, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6548947359131021, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8233283867781099, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787246106362, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.81167601367745, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4092207676517542, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.36840566131275704, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7170118948499103, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531254344759, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203306857067, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4571367046680304, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.47268345028154035, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2751297273936125, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39793840518055623, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937841197692357, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.42059959361748217, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31912137608082863, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3812195764872157, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.34334173886787284, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.548673495341467, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7371581537035381, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6654105668753184, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7634837631470914, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085778062745, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645957681332, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7325918157920043, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5717666015132968, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2005576781880203, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615910553977, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218811441977184, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7839884753971774, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5660185329894115, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.616935839156297, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241868378494, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441322836796, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7090191396207911, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7057850376420162, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583269834248628, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389909496667, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619470296833, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7431680249010773, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7310585819485983, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.713830773352728, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601341294899, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419952056807, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7918210668298356, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7634837744303099, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7356416431016701, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743672354425, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563368162932, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40356684238902296, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442251135201793, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7520125740109728, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.560252660267455, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094446690591, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.542863292953094, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6495786021334182, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4551986042648165, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398147341512777, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4054487288915168, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7690802420848571, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7138307533802088, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6619228773311894, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.692641999835683, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333246043865972, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.10594827914250025, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4205995786109219, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.06754669327355634, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132024309854728, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.10743746787778076, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5851011422040847, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5679366340312453, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5869964083852457, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2974699441652736, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381303550366, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5869964332558127, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5195213413815492, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085782662432, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676345762802383, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764966537449, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5078118746815531, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442251156129813, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370308007866289, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185299331693, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017702042048, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3106943809853017, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4282333794708553, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3040416671106766, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.396068177564203, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966483582527, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8848377678483699, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9173026525689792, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9155072394972145, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.862467548024575, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671469858946, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7943849469803284, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7431680025516122, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6315942869766112, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331664607522, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159573659419, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3867634352412511, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.654894706391696, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7356416324590489, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593293675109, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.451326520063063, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.22815651638904552, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39047582462256003, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3942009234525309, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522017619904469, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658972620709523, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.905989815244727, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9549844666540929, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9489172613667071, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9481545311558673, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9730364997618558, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6688802464728923, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.609524184692024, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.618780431660465, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354788118996, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990560420918, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.983085087214119, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8749346176225676, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9738443812272999, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9539660996597393, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9118099590618091, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8116760039007939, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7606506692557755, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6113819760907886, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.847967748663765, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581565666104, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5964331340930685, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6039318491343241, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.40544875928452395, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591211885936, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4263216003038489, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3775406660719137, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5019531264091116, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.35398629708286966, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.1699562315872948, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.464901586941905, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5253688086876304, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.34334173886772745, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3023910783872596, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746239596419, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213288699941, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8479677518519108, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.891054955090385, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9053223087581561, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187367977573529, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.837619960545085, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47657965529326757, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5679366340312453, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7662936499306641, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310325424964, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381303550366, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4167966465107502, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6808786375540082, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6206215948143775, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026799669, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137009220995, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7994423075219971, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7839884592929768, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6352224342525764, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681149246804, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637441343834, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.42632157651441444, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3867634454744672, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6261241892888304, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687307913032606, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786877191918, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7138307467185933, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8606036156896762, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8976952977167013, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389848982006, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442250963963081, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9740426425514481, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9635062331339453, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9681411424616932, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9683812329813217, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.954984470414588, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5409238713293536, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6842640298337811, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7185944004611811, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964227250611, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964191841239, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5945512665589995, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6370307909993514, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5253688265214954, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118636767429, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4785288439868402, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746255214183, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8210441081631412, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6636689357472616, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.611381987748094, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916056421793, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3468730751732678, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5525397418760977, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5331543771901595, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.519521307220486, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4148988258392937, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419722297401, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.45132650175417655, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5486734840094517, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366309270665, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891237693072, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8509646935966397, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8019358222933913, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8587185852909369, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9213576212084073, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9492946368162286, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3191214028219333, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2925953220470372, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2553436464733901, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2861692580880251, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204878975322914, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5273164983073133, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5583270009309923, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7310585525728014, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.830043766129131, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585789975382, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.12252321875504302, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.16995623478122832, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6057990403854846, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253803683871, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.30404166619943873, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.29259530983811965, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.36658973595544664, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43014735721219244, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468739081205, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262648657977, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46490155713734926, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7461389961884222, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.600188354325836, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640348600117, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631559428821, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6057990509779866, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8918110413918137, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8933094092215718, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.764891628779004, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7866228125858586, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8633916071949045, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5983122158677799, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8187367910887613, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085866952209, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591249104656, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40733340422777936, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2309197594589616, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.17781087457595238, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3040416747681887, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2782568041924907, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7799929040340311, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8606036183739475, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7201714906999881, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916246386791, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706083139284136, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6893056063266858, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5195213332869874, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6020615877671606, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.56217650897731, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358647401673, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.38121958286781854, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3123700082013061, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39420094945065853, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.46490157594015386, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974734172711344, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7248702691860326, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8428631550657235, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8044059235808366, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850297194257, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.785308596014146, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.28776780214196185, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4263215666134083, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2186693756608708, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796520603389, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4551986031015672, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.29583986658905487, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.13660839627152496, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.16132023827048658, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2407746030591144, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.18359362488137104, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6976089454921567, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.16667539189156438, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490871966075369, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.517570885578167, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876300019414544, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8365545640921459, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7826624840254318, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8749346107470285, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366702671864, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9005297768482525, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8244619371251419, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8984105436195284, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8244619344345832, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431679997861527, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278598305909, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4148988273569742, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.47463119653943875, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2643583715678699, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004056821153, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982762591805626, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5945512596163987, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4054487327443157, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.16026603636389972, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668456098623191, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2351083803615146, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.36658975189761944, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43206341697219436, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6808786159899147, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726835049762114, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504801505672, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7931059774308108, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8407825922098868, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7577943867535873, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.668880246756496, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835289467908, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7879311823210338, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9294403995536801, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7386690755912745, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760129201184, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339595926948, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6039318480102097, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.707404713200515, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7648915965706923, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734771579024, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846327174321, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7905302911563609, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6020615777410282, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.538983194002432, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982221760081, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735072735108, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.694302686553532, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.566018542461655, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7217432086539021, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583270102492933, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368406415129, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8116760088569857, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.891054955090385, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7759445611725351, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.618780414942993, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.837619960545085, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.37754066071017733, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.24220563968321757, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4073334200585735, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082868907501, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531310345501, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5058591061575425, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4785288308821309, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4073334226189626, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4035668804367485, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2133771724018281, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7826624819653318, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5506073647271348, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7138307449168091, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708829872413, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.620621607137338, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389831990809877, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5117165981817591, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6334102566952341, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2689414460328347, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.49414088268927386, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5851011700612166, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6187804101737898, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39606816098062714, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.45326186132108875, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.588889106051346, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5312093511496913, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6279512322308479, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43782349658052017, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.579400425010915, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358590352083, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4455295297079115, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264256033105151, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8418256564779337, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011813280766, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624874340572, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3812195824386755, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4629586114889866, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46684561206511216, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6757645942332752, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4649015897205454, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2942149533941398, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.32594952021865736, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2407745922712992, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.27202455802002745, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946967479501125, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5679365913982022, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6740504990343678, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5253688367892217, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020616086510179, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995639827123, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8670357673732625, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8757869936717639, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6688802511538221, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382063498005, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8816149018299383, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7577943690179065, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6774740167344603, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5214711354669088, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254023705177, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331265309208, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3504213670467204, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2213506822911846, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.221350685582271, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.10743747529962276, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2379299028337493, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6740504716324586, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7217432118507884, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4863315698962051, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688071207878, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762933820376, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6169358453395158, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.762070113102335, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8499711555564908, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.782662495139688, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.769080248707308, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6619228786949348, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.727975451940261, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5253688237283551, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743446502203, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420094214861257, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7310585590307875, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6584175042870752, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43782349041484847, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468592945388, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784046309684, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.963779946875962, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9801292846467305, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9594592646816904, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9901401454589808, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.974239441677033, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7520125647929607, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7905303102698281, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8489721973814154, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.800691998666432, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936532669269, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.894789461113077, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9416541613432021, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7592254047737228, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8732148248025544, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8918110489944199, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.941223443643391, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9190632940000503, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9381240116372599, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9155072508461704, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068774231365, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7866228173267439, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8128673084966364, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7786493282368186, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948006378782, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648915931374147, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6825737312803627, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7905303055533671, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9213576219858075, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995842057868, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689539169994, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224377686643, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7786493352210405, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583269802492299, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.682573705327567, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549150016816276, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4902356150389894, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.46879063381354086, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.48633153829387354, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585572363765, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.598312183005329, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.939470611441811, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7704647909063792, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490872073701954, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149947844476, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675363375793, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832062997071, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6495786244368257, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6187804423237946, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175083297362, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684602597347, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.17781087351342195, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4746311802065733, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.23651625316553695, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.18126320693280112, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203520181562, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7866228160964843, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.856812311429652, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8407825941171813, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8080672250421903, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620754989149, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.56217650254414, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7264256090237853, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6654105630357201, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8633916084467123, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850186745884, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6842640196808052, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791787010460301, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.700894824497983, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702879250496, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527582103446, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4073334093076622, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7279754306546595, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6169358464046826, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.613236556067238, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.42059958502832484, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3398276370351032, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31069438256557014, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4339814757624905, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417253732486, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.35577489409748775, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8479677622961319, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9394706128007762, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9399133500542295, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9314625064891583, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074047101817059, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9284087929632089, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6601723889646064, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085848099546, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324837692836, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762857671305, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.478528853753311, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8198933433718611, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7879311965808645, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241612037439, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737132702204, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46295859044047216, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6757646059014518, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3998116580608953, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033461370654, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519859375437743, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5350984150068058, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.276690531563782, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.25982561674927024, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43206340518562814, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618519894885, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.42441199565544807, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4960938269766179, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.300745595057271, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.26894143131908366, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413789243178, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7732163751174578, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8233283889004137, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5312093535316947, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163795300694, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8879840442807695, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5755879855441073, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40356688017489944, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4225046161552723, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052808606081, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331543710419928, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6706083158536132, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.41869693145189424, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6406358728640772, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026868327564, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321893224353, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.845942439134794, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4092207880359498, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6842640310849533, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593237132013, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672219921834, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7704647736549779, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8991213859449334, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9111797066449421, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808785651012469, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711776978424, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9263037327468329, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.951863228459683, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8587185747083149, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8918110538781945, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9348724564095974, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7704647931640293, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7386690730907612, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7217432015732678, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701055009851, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918360049282, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.42250462686406426, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7170118752266621, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6020615854343673, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947106296057, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756752449381624, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8529354734209498, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8449215345844683, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085746447456, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118975116802, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354754101489, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3575675194154425, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3380771404680344, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3942009441920175, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.355774866000377, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186969235610932, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5370413796426133, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5983121905459748, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7634837566082988, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666041725199, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224373394016, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8311430528529987, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6876299933885043, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8902942208633091, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8925625264247912, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884654316157, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7931059589493487, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8092759816047432, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370307813439758, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948248203603, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8840392833523268, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8856314681809465, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8428631472891176, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7201714967972603, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.881614904168442, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583419980814, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6671476662546577, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7690802399097411, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5234203522118627, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445415474603, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947140044186, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.677474020713534, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7994423181837592, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.45519861037367815, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268346669515554, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791972383809, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7185943883155753, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7431680144135014, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8322366540030374, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059646022559, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892337058252271, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49218815150553097, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35577487267407293, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365559788597, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539863139308422, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4746311870274707, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3812195680325822, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791787093435975, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5679366145134315, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061598441011, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370414016483278, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6460136908390618, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7233094708252004, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.707404705265823, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8489721904805146, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948045118063, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5774953711429344, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7866228333183546, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47657964472961317, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318332656483, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.672331698208986, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45519860298933623, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6808786210418527, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7446563515490009, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073580102299204, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370414059847161, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8365545663708935, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.71701186666297, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8652240885435087, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473890790681, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213787165098, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7577943644089418, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8856314791223608, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8044059262111907, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8289388276157997, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953766270019, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.644225109463259, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.36840570139678985, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.689305608646507, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907613208700904, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39981166298897775, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4378234860946328, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4649015728268646, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32252599024788414, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365741294279, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324654033478, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6442251185864863, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6095241570271624, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5832033596007385, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585651776829, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765101524347, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35577487267407293, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.29583986565233483, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009450624917, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.573678384121597, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.38861802861569744, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3468730879749848, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5813030847690416, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684586439324, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48438008014011186, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5175708549255003, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8278281450443802, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4863315314569029, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168779690198, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.501953091406201, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3276683119649512, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6740504618826785, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.25534365611790655, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633152804469065, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073580152433126, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8278281787767109, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8354835262627271, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8322366643679507, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8624675226414973, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48242912380854336, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44939264194215056, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6132365546203713, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5888891397053673, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633835116598, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389831921210967, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9241418176132274, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9358173570389581, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9693242013416311, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894616291352, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388206311975, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5078118713027322, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4532618273583226, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.44939265125755584, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368443800761, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.25982564595296687, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5525397016569618, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6150878492197499, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7813306192195952, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.474631167279943, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735030303201, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5907792113968282, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.592666602253705, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358545331067, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311931894334, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.19559408275705442, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.26894143146474864, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3073580217122274, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740816848338306, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014733477818, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7813306257073507, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9284088033076099, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6224593234153428, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253736393931, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9079671394115111, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.42059959769671806, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791787072363529, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5525397186463394, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8596637365633726, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585755766406, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.635222426348975, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6513548449673237, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4148988170613943, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746200634965, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004161219767, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.517570883161073, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544100490444, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8365545698527307, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527787979922, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578407996174, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5869964149369349, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5640984899643062, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.26284183695742996, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204876943883947, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.42823337455958904, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4551985824747869, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.379378405424134, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5907792173532571, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.35042138113796595, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814056014635217, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8757869756104479, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8278281473973136, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085582931695, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068642124579, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576201342843, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.48828338440544483, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7786493144124168, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.45132650112332556, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643769045486, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982261705065, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6688802286178614, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8244619253425302, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6992544245583995, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786236061354, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056392849721, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4824290954120204, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.44167301793812164, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38121955282950976, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4785288447235175, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641369309194, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7648916205656592, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8643104579656771, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5907792106051852, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953949081072, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8278281668436667, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.18242553327761316, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2974699559544041, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.36116471439406167, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.29746996048305807, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3106944022060496, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8688267788157529, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442251202578249, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490872323498757, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869999071604, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920229032158, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8606036220366889, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8816148992680141, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8774767856972234, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352931322328, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.859663753497594, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8104789087376586, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6424324865014002, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7431679945372904, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689359710864, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933381250064, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.13846180269662706, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5448014044494417, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47657963551532256, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510839974222, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127886923641, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7431680074759255, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8509646934742214, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6442251251213298, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898491756206, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563638371464, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3629691957940513, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3415825108516612, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.585101141221045, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213850180411, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4263215892772059, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.386763444495727, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33111972011662066, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4843800907506999, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.38861801927148043, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2942149803297599, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3208212749646367, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4244119807085347, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39606815211643687, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702254032187766, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508501257140358, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4707366107473725, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.191932787342938, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30239109144921966, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988303287921, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180265198153, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.675764610592343, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.654894706391696, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6169358274868777, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.616935819264724, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.451326520063063, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6187804230341435, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5117165892984104, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365813364887, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928920502492, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690795706381, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5195213324278616, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.46101678102027444, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47073660979268517, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276683049595594, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707365904388476, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7233094600050839, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7534666539803128, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.564098472926293, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331398357534, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898530244385, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8606036194434924, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7690802498340704, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7170118778074412, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744704942696, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460137020547919, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.359364144559971, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3720487884905282, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4941409048937074, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544873126098374, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.31912139686374913, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4455295227239426, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5370413900034009, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.513668447793394, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185441352402, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666083704122, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2613309326839637, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4263215666134083, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.16776334139163268, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3007455869201486, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4551986031015672, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5717665962393881, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5888891408182902, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38676344176721794, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765128607878, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680202489892, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.749087218697299, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7138307478610049, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5467381856029103, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366170208442, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424344974357, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6460136924365706, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5156199194609081, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4824291085768571, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.47657964184323454, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.631594313442873, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49218814096096747, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5621765049871014, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365447917033, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381524352007, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451342469818, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8104788996617174, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6315943115419033, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6057990527634245, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633760559152, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506656031725, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7325918553967611, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.702530073988465, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7170119003841698, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013983772828, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.810478917510183, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4397473253613203, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6113819764192309, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5292633934107194, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365537905807, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397029469087, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.810478906126883, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7676898519422997, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8092759771365339, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575727375352, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872021859958, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4092207824795196, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3923368400407502, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3942009707554547, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990272041439, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666298855769, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7563575456706607, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.844921528830882, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5755879796259535, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.620621651016609, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256024175524, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6424324625898328, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6460136909523942, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7866228270021128, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241607361553, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.548673485567175, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.32082129462066455, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43014735988702496, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46101679214858765, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.548673478116398, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32252599119236325, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.35042137679573, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.494140895350691, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4320633680484784, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798284960506482, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.468790630763461, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5813030783566604, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7217432135319642, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370308015392627, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324727097293, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998681776881, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4960938405144254, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6020615815951419, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.36477758587449965, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2814055911140071, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2568320030169906, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8449215351929381, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9053222997664628, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7718435117841271, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8499711816127444, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8757869911773046, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7310585863188214, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7931059562935271, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8164063912454421, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9500414746828559, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430534522686, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9403530618921538, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9529258235120794, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8300437616300826, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.884837759914921, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9173026607058344, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8807970786255185, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9079671359444922, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9149009460203902, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037313521212, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9399133527285571, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6513548668112599, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8783142557020737, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8509647024833328, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953424609457, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314759324297, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8322366623951742, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8606036339805995, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9005297885886184, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210441270502562, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233284021807096, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.700894811469649, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6187804265892666, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7704647844595873, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982353818622, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234916371501, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7620700947404111, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7606506534522367, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7931059425708509, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082902310732, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004070386259, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8128673037223175, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7892337092672022, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056042435493, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972755513941, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802527338996, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9553191296457688, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8832359918538786, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9224823405218598, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361536659289, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8969755717442541, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8624675462069678, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9142907251299369, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8998277824974187, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256495718847, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.916109605302344, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8116760178607471, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8643104579656771, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5851011630521386, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527691956941, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300763124264, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419904011563, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6601723693835615, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6548947219379546, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056189530563, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239931576005, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6791786948615491, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5428632882451555, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7279754650630642, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643895852892, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852883637539917, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.55447045278737, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5409238790098415, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5156199343917722, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358403258431, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947050906536, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7662936544716485, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6548947573440463, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7786493048648087, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278696275053, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624721319594, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6943026672980656, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7201714901908689, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.764891607705419, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105530794913, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633915998099632, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5888891189329273, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6242935283362965, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365532439565, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631616597712, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358708090171, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2942149795006732, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2845760056735838, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3451052820321839, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418413936867, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645965012699, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.12678517266706588, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4436004268581273, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22541662938287874, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.1980641841306636, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946967879565404, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7008948091032341, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7310585591968893, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6242935425213345, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737245577804, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548639891493, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8006919894461054, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.19193279820258316, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3904758351200328, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.21866938203378034, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668455943203461, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5544704853539312, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4320633716733965, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5506073532313859, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.30569734118493025, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.49023558326714656, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6774740407914293, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6757645988142228, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370307914491793, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225260125422443, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746080745953, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8068526300772936, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7853085983177508, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9118099586787605, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689691527317, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526607251017, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5253687971823414, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5774953502903724, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49023561088625495, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026953081077, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.82671179347672, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5409238646283664, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7799928996821168, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.702530047394498, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4513265008892888, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424289890586, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6959583394801675, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.579400411783648, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7490871940615038, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228206472494, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690622378715, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7490872050506823, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.40168781830920036, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6513548810593321, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852882139959585, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736783852403335, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6388352629595777, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6825737575058225, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6388353066516714, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633103255655744, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473539876018, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9445872081515284, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8679338486986284, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8278281540644985, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840471538687, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.840782592169232, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46295861960756673, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7786493140942977, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.27048023564560175, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881319585773, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.29259529917800803, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6548947282719988, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6020616092065406, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4551986146476647, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269303285835, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358401173216, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.32766829672981124, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4244119740862855, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38306419773535466, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.38491214964696985, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615880116622, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.17895590427633287, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2056150535454948, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.13939637680529962, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894561386113, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108617483413, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9884026380629103, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9920620061491194, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9919380082789355, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9893474886944457, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9910145714926799, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9885803853563601, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9925393567273538, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9888419689303177, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9782188278258732, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9895916867810689, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6893056050617722, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6020615738312576, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7826624795923631, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056076187295, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832069555631, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4320633976912306, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6001883455996895, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46490156868633, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415824816586504, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159613418367, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.17217186075319718, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.20055768805800878, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.05108274176439961, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.06512755042455469, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.08210662857007639, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6825737533927714, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7690802336300251, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7041601221876294, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.609524192756862, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165290481113, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8955226869776646, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8864204135142197, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8300437687744225, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759650657746, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195324043802, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3738758020036889, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.29583987343034346, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1581743517573763, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256351363341, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.30902370453621625, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4785288186614747, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5525397315157566, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5964331668727009, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263215663836812, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.815232484287813, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9278878020019805, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8019358149262158, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.762070125717977, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8749346174253788, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581491113689, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9358173588212264, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9252299597141176, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8539127416307587, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.913676526962785, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9536217901398782, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.46101676486378124, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3007455872125596, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.18359363628207842, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.28457601473268235, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922078661491823, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4436004080504371, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6842640217273831, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2991051814625894, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512139386186, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711583585474, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5506073773663025, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5832033291925023, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5698526545149872, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902355924550906, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.515619899390018, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7772998506945249, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.871474864633529, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6688802480690205, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584174826469336, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.622459342039205, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.505859096280426, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7969253891872464, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5679366112702923, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.63341026813815, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228553354052, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5794004100742083, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7401743665296235, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5350984274098055, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352675525639, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740201382737, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.413003555293572, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7759445482753593, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49609384478943386, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512930650825, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238849863337, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7606506583734498, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7772998418842659, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085744601991, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105683623217, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846451510108, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7634837517743845, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.509764369600455, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3611647320752442, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2751297343775985, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.43782351603400715, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6113819813144477, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6654105439941514, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7476159588885082, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213312410032, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.498046900728303, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4882833951116618, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6654105439941514, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.64243248901993, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631557908037, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526496311968, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8044059313479801, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5214711468836084, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5544704469405041, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723780004287, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.552539698478232, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5907791967717978, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6334102377361467, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.35756749303406726, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2735744090676501, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995694105466, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7786493114691596, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.871474864633529, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3293917130619585, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936613653943, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251232072921, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.800691987877908, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9190632854439903, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.860603615063001, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898500938478, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505384028268, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9671630458283484, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.993149520546169, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.99435809167984, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9905142861429095, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9852713867744981, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4843800703221934, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6740504949417907, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7106283168571628, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850458902467, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.49414090700671204, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7577943829150154, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7772998481652041, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8376199505736636, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850431602857, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006920170175139, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.24220563242750145, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3007455872125596, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46684560686337156, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298812679461877, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.40922078661491823, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7549149865031916, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9273632986484367, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.854884643552643, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755801049298, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.823328402008614, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7371581701270075, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8311430488559605, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6859494798734411, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892337067302883, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063745627499, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7090191346747226, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8221891345940374, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7620701337706353, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943786289867, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102411100132, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6424324899867262, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6636689525009918, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4244120043569731, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321572026318, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339609802619, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7826624813645382, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6706082959377246, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5926665993927301, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307682534403, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526319444197, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8210441172651928, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8056321943622533, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5926666007478486, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.913058341424306, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370414182025665, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6020615817517706, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7386690722644313, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7718435001299125, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743464786635, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704622206281, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.871474857429617, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8840392855498206, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9481545372729991, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9403530600349174, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8807970770820893, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6187804412423888, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5214711762811495, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.527316549371278, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205995640003013, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512236009562, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8104789070273517, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7577943804672548, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.830043771108858, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833934264974, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033717333229, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.29259532301417945, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3040416848248911, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3960681532280807, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756751879565446, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.35577487928949897, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.804405894388804, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8732148330312741, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6169358104858845, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256050893713, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.713830763242368, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6039318214338494, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4571367310598633, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5907792107308356, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197735677276, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132654022622565, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156199326145838, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3140505613586864, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5774953762566032, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3504213714683869, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020616106778436, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7704647887284825, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6334102580643609, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8255897151381515, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.729519789356422, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520126015969685, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.41111084848728274, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6774740188482069, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583270115914652, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765000725805, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593426204338, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49609381259564367, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7025300738009539, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.778649295658102, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4493926382154846, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004020514737, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8164063736769254, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8633916042865943, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.592666588750383, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094729123366, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743839234355, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5544704561503938, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3208213150434547, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38861802626204917, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723724405906, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.713830744063341, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7563575547576376, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8164063923217189, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7892337181220845, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256103519351, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195320659065, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47073661021325214, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7356416298881989, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.31405056664304953, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366388390089, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.44552951928732487, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8615382117056419, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9559813467331042, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8499711843013599, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325035761609, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107924776167, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7138307375261242, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5794004014379946, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7592254065962771, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504584531208, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.560252658427729, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4244119786390743, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7325918320560174, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.567936639054785, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358604441593, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020616128692116, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4513264864643475, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7634837584033725, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.594551265386606, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358063588687, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004121710279, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8322366469296077, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8407825803680947, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6315943186124857, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846392550433, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343688203003, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7416739854768815, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544248246696, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7138307464924617, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640353816422, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619276851841, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8459424380419003, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8365545578386896, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8976952995439538, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907612248035323, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253762007434, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7138307877228333, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5312093896583207, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6706082890596978, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.735641658703032, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270293010645, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6959583165545177, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4436004404715703, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5983122130560142, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733751339155627, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883506849296, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.38491214874944857, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.789233711555138, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.546738159698508, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982420733613, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762785087865, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5888891441416678, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6842640289886082, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5409238907099428, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.46295862226296125, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947064350692, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5058590917159596, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6495786278083425, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6076631551734073, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673188934048, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056306315172, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8740772264809406, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.44552951487826914, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.737158185793624, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701129029238, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424372073064, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5312093636013072, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.64957861556505, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4130035799223757, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700975848154, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526515390505, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6909762727873977, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7461390142156654, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4130035837916211, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585665555677, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786414360594, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.825589726532878, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8333245980781114, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8783142401272123, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063742079936, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467721448141, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7981867658088406, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6688802684513562, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.86060362287402, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918359341387, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445356646262, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9433475726495365, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9453993961953289, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9753900705605815, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9626731132436693, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9651191108443142, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9761291648614615, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9588471102767276, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9224823466750102, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297926772194, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9130583438530824, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4980468665679542, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.509764394988879, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6619228826037837, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804456481423, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092207955951866, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224606138019, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5717665910017217, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6477981979010075, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601220480899, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575611774268, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3040416881185459, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.583203346854633, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.36658973968657066, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.435901520369614, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984290029551, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7956581073100323, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8895288443270388, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9416541535100085, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511417074417, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9623913658628942, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7606506579550132, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.47463117081519207, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7041601389222034, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974733243992314, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675412222771, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7310586035271476, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.754915001114228, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7233094909954694, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7943849524321287, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442250980305271, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5755880057535382, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5736784020268784, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6791786898603179, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101679457369166, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241545709139, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5039061561907199, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.38491215987757316, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6774740097931974, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331543791601621, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358249384814, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6531269301927649, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8221891389608673, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7799929096436409, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690624877771, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.834406885885309, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4843800714069666, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4320633716733965, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.42441198260270435, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252597879030026, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764978394319, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224321562104, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5156199172151308, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5136684690242173, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418528388594, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591178890225, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8633915989431505, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6424324785473142, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.665410557817406, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8428631415475217, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.562176496873511, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2436424496740407, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2030746324453847, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2523840488561316, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539863113054464, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370634473462343, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4785288339949233, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5389832223277223, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4882833813069066, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758183863109, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.28937170974123455, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5698526465631626, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358264729877, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6601723769114975, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714869576514, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953659503104, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6723317245199858, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9053223055391819, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8933094071608205, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527657699004, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.737158183851712, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.439747334533194, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.35577486861463414, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5583269815122175, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586343516015, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197778806358, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6388353039926887, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31742627392431055, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4941409053091992, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262808671284, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092208155995544, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5698526406935706, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6297746144965694, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3867634283156126, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.42441200736593543, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.46490157502001267, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44360040626156694, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5832033291925023, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6791786962018835, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512271195514, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615946847281, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7662936383405831, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6976089163625715, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6757646045894168, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648915978482784, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.592666605759879, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47463115693741387, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6842640313482042, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7534666465016268, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.31405055578045155, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149716622654, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7549149655692308, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5350984174710625, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.697608895561021, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545722745339, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786225212513, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.23651622860895494, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4244119945369509, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.341582495413912, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.20561504722325671, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.26740815981981986, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8479677651011366, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5117165881012271, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6406358557711833, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740074959797, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819363740862, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7057850321588405, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6057990414398249, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6774739879002708, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020616022137713, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723851762934, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6531269106093605, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7025300468549646, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7279754464866884, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416219932128, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256006946936, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2845759979571905, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.314050548616567, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.49804691084466757, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259841037383, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629585912866534, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5506073838642324, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5907791928380607, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6224593127868192, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089097860101, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834460467077, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.36840570466738476, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4359015319521641, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.535098434863093, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.304041701681374, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.596433146522155, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6279512493630851, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5679366363997604, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7563575762925274, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920087133899, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.552539728393722, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.37387581405731835, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7041601247198213, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2942149702048738, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.35042137986268357, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2213506924955933, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8080672154300717, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9105453951771072, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9278877955591236, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.889528855993836, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096201578283, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4882834040664816, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5214711573541704, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2735743973538922, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233683473493147, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3867634283214521, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7325918073577695, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7662936402712198, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7154240187030048, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774739973397039, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786284253492, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8244619364369925, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6654105372645577, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8872046012551653, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215218782832, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127558317618, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3259495297936211, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.26740816725440963, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.14903529372412236, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.1259227671817311, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.26588046706573815, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.25238404858071545, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358558161817, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6424324956138292, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358364995101, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.542863275230233, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6859494581755279, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.72017148820314, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4359015406984623, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552954172208153, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668456176398218, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8670357600505559, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6825737202493523, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9572778000577015, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185131559623, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346139166713, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8233283965630037, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8714748571090498, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9278877970278719, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281550508387, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9412234378042494, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7905303230637981, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.752012574988158, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7356416509477667, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8895288472160653, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217431949585413, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224213114306, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6654105713596276, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7943849636182683, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804269816535, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241879849421, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5136684553326673, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5813030626535587, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5486734831404061, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3629691977686923, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.511716607530866, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6001883462131112, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5907791928380607, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5428632835936233, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089097860101, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834460467077, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3775406684585238, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.44167300248702507, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4707366048778942, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40733340524684875, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32082131233982214, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2583259826168047, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3923368595176202, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.22270012747901669, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765261888819057, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167980929397, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4263215831549895, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6261241718025853, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5679366035980024, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943091348112, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528100893749, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49218814230843366, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6297746153817185, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46101677204211267, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366166159755, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445615962803, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224262099911, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6791786854004106, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365523068374, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684764698476, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618597668486, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7074046811413347, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3904758354897277, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5851011491049724, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.42250460955559016, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755879955749201, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7969253714856958, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6619228533437267, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6943026774335775, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688161115206, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746103424877, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6406358663862828, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3812195492104787, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5389832132445391, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586112302142, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.709019158521593, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5736783943309086, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5926665925645277, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6723316876763014, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512783111354, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512142354515, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.760650647289658, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7505527703151672, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7248702842222007, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772248641475, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878544473164, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.33458944169116894, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.27357440091515844, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.27202457859847123, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641460537325, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651622605766368, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7866228343051389, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6406358463634313, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5983122074453702, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416441564458, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094813636995, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5214711590811895, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.848972196723054, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.509764396091871, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689565920963, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.71542398478352, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9399133528087141, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7956580917717866, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416375628441, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585685375535, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2674081794940546, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6876299989498891, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5964331644780245, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.31742625310176736, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632844515034, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.24508500900688493, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3979384175357735, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.17217184614914305, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.35936413949955176, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.25534364994995834, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.33982762465737704, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.49609382503379357, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4035668577654068, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310571190335, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197711067697, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6224593631948945, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6959583302906414, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7826624921914048, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046981741493, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.46295859560485614, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9615338044468361, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9553191275691787, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9207896777463568, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9367494764433024, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080774197097, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.791821066758462, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6671476524969099, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7264256194621872, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754591633798, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8459424340001017, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6566582553630539, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7606506741467358, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7718435031383769, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942890563868, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784103629, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.685949472828049, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.44939261857029555, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5292633606408255, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704726114313, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.44746029670062093, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4359015254953304, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5525397057803741, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4960938256894638, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689509639191, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.29910519720174966, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6460137101470779, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7772998741740452, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8807970832971113, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4960938126190704, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346108856367, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6388352879812154, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6020615771252521, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.540923861670597, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216057732474, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315327858763, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8140527905245697, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8438951161976358, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7786493097576842, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601672761145, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9066531233005455, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3468730742390984, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.45326184719669527, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2877678199559889, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.38861801532844836, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381305770357, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44939265614659496, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39233681862617054, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.23231012612479016, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679661786398653, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121179110342, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6460136974829528, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5350984157638905, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7057850369884489, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197684933177, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419922191266, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8175744714766892, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8469578366371314, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8333245986324769, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8615382100144321, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.825589723221083, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8577680940569997, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7662936647181152, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6757645869433864, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437580872779, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578378094836, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5640984661369859, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9273632906724716, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9161096086929792, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.651354867263076, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8697145791918316, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6842640157021915, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6406358568074868, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.749087220005612, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677418941257, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122882535399, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8233284183636419, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8807970774036397, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7386690823759686, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407825934085504, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.853912758032536, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7138307359710467, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6460136844307365, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7138307412031485, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118359108658, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689537451915, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.525368827236027, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7325918407852673, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4092207991711065, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.695958330026186, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4649015755183353, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.791821073638612, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7606506693342269, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7799929029338853, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9339146262366725, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359903493376, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.28457599078802703, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3056973275370233, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5312093769995211, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111086700055466, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681862691661, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4513265280545749, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.548673469614503, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6261241985473394, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074046785448339, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764921227704, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.881614900669652, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8783142491637693, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9546474183341637, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256483665533, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036145517068, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8289388173980341, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8210441103313204, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8723473752227773, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389781637031, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8187367942129983, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6959583423557298, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8766343796113663, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6187804235669088, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118972192191, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998652623215, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7217432277168183, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8210441222271108, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9184802499475324, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723648015575, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175034454292, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4205995843919615, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7866228372226485, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056044649828, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199298049463, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898563597832, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45713672758527407, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6842640144420072, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5195213344798137, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.626124175466573, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300630895569, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7248702805013844, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7248702671864855, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8311430463761628, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526400485453, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8910549416578362, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.692641986719021, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6548947588573166, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085845726655, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526330330679, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947275398668, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6224593200801053, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.583203347607774, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.679178683526477, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723706966631, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.600188357293268, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5945512792692939, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5292633899490079, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4167966653452883, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.615087856304596, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754352487927, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4186968854454822, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5964331445774831, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5621765116522555, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881259368069, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734956118817, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9693241999803789, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9504109790423545, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9465966670537973, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9645892720261336, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9334308143673941, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6406358663862828, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3812195492104787, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.37204880589112005, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101677407051306, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512778992764, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7185943883023908, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8376199885410516, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3886180178897819, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761266548968, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7943849684865755, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8791467681316834, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8732148320484674, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8489721957538918, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057849996284093, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511451964133, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44167300253942177, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3979384322287881, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.33633104400256963, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.30239108285435673, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406668311762, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7325918376036223, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7577943608231149, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8333245992488643, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476589962831, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.884837771222243, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44746029017664907, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6297745948631139, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.658417504822166, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850208598421, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832490789669, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7041601332439713, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5698526433333349, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8128673279727722, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748690748254, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413834879821, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5312093735951517, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7371581514909195, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.618780441193584, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.743168005851968, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366036132139, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.43782350309338924, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.46490159954693894, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32594950352143776, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213992648518, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234871882624, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.43590152637532453, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7106283049033667, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.29098086965704095, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437707846255, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9105453962807936, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9246877003460992, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9358173579380854, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185849963236, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933735166248, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.49023563239182455, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.513668443637552, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.36296922271408727, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102588832444, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.38861800939183566, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.30569731777761616, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2030746280649171, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4111108450729666, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798285089571818, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.225416627543108, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.366589739529354, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.41869691951322985, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.42250463175167646, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990652006593, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.32423539253841344, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6406358587143954, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7620700936217336, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.480478669578074, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.602061585786834, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832171738854, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7264256104644434, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8210440929139509, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5292633894766056, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.35398630118428415, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033634187394, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6992543896595149, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7386690792568363, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6740504714169511, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804687083774646, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215339597939, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.548673488140508, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39981165838135885, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.527316528233157, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039062037044021, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876299896728154, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7264256167531781, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.626124190780906, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5851011562815654, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898459926985, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.718594389626348, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4474602830807968, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6297746153817185, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5736784149734274, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358594405573, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105509337851, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4493926357815583, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3433417361427646, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5195213269062963, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704648003093524, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292634055899637, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7341195327085372, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4629585936161349, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6548947071628249, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689522208926, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201714933465917, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.805632201819562, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6566582854022901, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.754914985664038, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891443232934, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754392497503, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4359015142383214, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2829881185321056, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39420097652190145, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.19072402851376574, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523382708219, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7476159615142055, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6279512285726115, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7074047114608234, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804289174366, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.668880246162251, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5717665945558615, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.68930559650814, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5679365965819471, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953820029786, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283178661094, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5926665757815381, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.42059959406404973, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5214711735659713, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974735745272414, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.573678400481377, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.44939265102101006, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.23934934382926837, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5370413961741272, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3504213723667699, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825680654971024, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6671476740920138, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6039318078036575, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39606816302968045, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307850632809, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843800897221948, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3242353831882017, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6442250824352982, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6132365721671212, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676342822046694, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582609933701, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6671476740366183, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7248702710502116, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7279754418004453, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526584652959, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.699254403667486, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7704647913799489, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7866228148845189, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6169358178499244, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583117355306, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.692641973153462, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7732163783003797, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7704648027411245, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5331544038697626, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581674394152, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.806852610276757, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5621765065221899, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.373875819474708, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.687630000011179, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269166836496, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408780467424, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.37570647606663554, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5467381436543137, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7563575623936429, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796431540054, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504799889924, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7634837399089809, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6601724259091075, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7170118836211399, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089288652266, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998632799211, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6334102684400603, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5506073701655582, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.488283417282765, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026642829928, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592253963794321, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5832033467986801, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.32766829544149084, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5253688121013702, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331582034673, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204877999862224, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224322898492, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7401743771977742, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4980468635575421, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4282334012087465, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615868628427, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.27825678378395863, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4629586060101405, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.15203224072115323, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047867619054196, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633749641903, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.649578605894627, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8019358374398335, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.42250461206958784, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837666506186, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.590779212544151, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4035668723460682, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7826624821698421, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.35756752115560275, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.47073661715898973, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419853169303, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.45713671690961377, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4902356209599579, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7431679843019304, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802644059183, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197600543548, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3056973224905372, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4167966579203968, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4726834701506427, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3398276314804293, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.28937171203900264, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4765796577396782, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6388352942142382, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7577943676593745, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321838051534, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.824461930417441, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5136684738185641, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4921881238083819, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6279511995970045, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526539548151, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269787306804, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7490872217638064, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8438951161976358, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7718434902307004, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748573914602, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907246286801, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8670357604533188, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7520125790071157, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.811676036659487, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846363958874, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846431359329, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4649015587456075, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5525397157308677, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6808786373496489, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059959038120454, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666002801076, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6242935420050004, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9190632905437337, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4416730116898011, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.76908023548853, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647058414346, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9219218322196414, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6688802679475472, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7325918304791009, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755630113179, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519527978472459, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7943849513074479, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8519528163329866, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893055906526949, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256100018126, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118733476408, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7008948036057406, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.33982762433268676, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370308103051281, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708645418061, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504831220475, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5869964257336939, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5544704301978663, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3575675170445542, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316808501542, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3812195662558299, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3942009470840598, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7931059359547994, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9213576137072028, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8723473721354889, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.43014734588998166, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5525397157308677, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5717666155642627, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4687906132632568, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.702530041471745, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8688267794588139, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9507778825575033, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8198933237715872, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9469902280227253, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437735095335, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156198931131512, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8558511361194816, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5888891319176205, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358500355122, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493023276492, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7662936638072332, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5544704860690514, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7994423277047144, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392906457616, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953798845254, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6020615872447681, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5926665880503406, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4092207964115029, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102639179378, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880085820301, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.20946969764138648, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3451052850045403, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.1677633405308712, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064704915038, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.336331044147265, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5869964256826815, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6992544253797247, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.734119519556326, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.390475832707466, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241667330932, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.586996415413254, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6893056049241215, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6566582629787849, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792053570127, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416400145981, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8031737756466625, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8539127586744337, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6959583193528338, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331544054532915, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867701971667, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4397473487429512, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7154240073673729, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5253688233873072, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593105582824, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073570774531, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6224593344272148, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4726834580659135, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3415825093749126, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4225046284884666, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118530589244, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.22270014080901177, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.16238002932416895, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.32594953254839254, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2766905288892547, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2407746066870172, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7008948323856516, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4035668458621215, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6825737364190975, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792202602572, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590761427623344, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.35042135536497854, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3593641624924419, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.37937838278965086, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.26588047324562564, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39793842792236334, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.573678387112946, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6001883584353732, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.34864515276040864, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.46490155152375146, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525396941075502, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8019358224599672, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5774953874392463, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5640984735961828, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8333245976172144, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358191241622, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7025300403623438, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.754914990245998, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9257686308378867, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943650732949, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359877226048, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.27669051924211235, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3665897413533757, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4397473287306222, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.36840570500334224, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3942009553750262, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8376199790837845, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7154239994808672, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7786492944096914, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357611672878, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.712232171774011, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.558326969391339, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4359015130960117, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7704648072167022, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216299003225, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646035526255, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6352224320764689, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7745833895482909, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4590761197653776, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984286694549, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633152080416775, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6224593361463983, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.401687800638875, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4610167893117087, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509128047228779, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730957163089, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6388352754693414, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8006920017852837, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8344068811136395, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.707404690157257, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582746429241, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7620701008631857, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8459424306721742, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7233094619512173, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9213576208236524, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9059898135736736, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.709019139595006, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6671476974823995, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4882834098689895, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033619908604, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907792123512786, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7279754503036179, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.858718595709709, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.809275979070813, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9124361560851075, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511427506145, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7718434941138496, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6548947359131021, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6001883843405992, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073861123346, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.81167601367745, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4746311767759544, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7041601379369035, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3433417477352775, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3904758381938515, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879311973958564, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3904758427835154, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4726834693779941, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5350984424094892, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708735184263, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982013777273, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4746311536053725, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.656658258253501, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3123700007190936, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632741371308, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764985569476, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7279754505157091, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5058591043514514, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7853085745674023, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891341604956, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476978273869, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47657964626498006, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6020615904554191, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6548947259536819, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011563792224, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898606403034, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7676898538198443, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8278281537924366, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.667147675125081, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632755859405, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637426351318, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9324533081963694, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9775429446259063, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9367494838380309, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9722043750253935, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9522199297850096, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3757064754260068, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.39420095091486607, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.16885694590560033, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213189842721, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051924872831, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7122321836233818, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7341195263025454, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5602526609104864, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203421487744, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876299984566172, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.40356685549318216, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4551986205825728, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7505527653312212, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.43206340029134416, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723767693304, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.35042137948920443, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.38676343749289266, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4111108552711436, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40356686494703964, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684559176179075, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9235923283340384, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9224823435954576, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7799929224652535, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059103547683, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9829546828183303, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6057990198284939, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7461389824023853, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5486735076257162, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118874315042, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.724870271053323, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7520125804595694, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7025300743061246, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6893056120867559, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786883844385, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441179364897, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5717665909979683, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2877678169602223, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4824291169220359, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658974856649773, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.476579657439973, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5602526550163847, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6495786181125062, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6370308345021991, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073333873316044, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097644006554876, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2422056414771597, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.51757088695625, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3923368290188146, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.28616925644766317, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092207942188375, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7201714975434088, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4863315418484844, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.36658974011405804, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102620402056, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167933455185, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7461390148871454, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.821044108652266, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8757869955901207, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666817209136, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933380879943, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5679365892568914, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7371581430757942, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6076631861654159, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047865980433596, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8624675393018302, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7431679896868459, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8210440925886996, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.663668960898405, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640185130434, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701080660043, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6859494555291491, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5888891123214017, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6740505044242086, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238476034451, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477981894719317, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6001883667310016, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6757646069433535, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.38491212813951875, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964340157687, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333945498318, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5964331410227769, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5869964439198766, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.687629999525527, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300586723052, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197895075398, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5097644082261582, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3960681348286628, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6619228820472857, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.30569734291673556, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504808465783, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5156199093051061, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5926666010058323, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5389832218533983, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4824291109247259, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315199893155, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6113819775876668, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.4359015219564841, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5350984274440788, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802538779739, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.42250462987859766, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.39420093920180505, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6279512347031753, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.2628418467869184, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.3504213853350935, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765233479613, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7505527579093548, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7416740283594144, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.47657966855857836, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210808697561, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631840067073, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6334102694784587, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8140527883117834, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5214711454594171, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527645331257, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352729594917, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9829546826026461, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9901401444728384, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9915543729406121, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9849273713743272, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9925969856647964, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6757646008285739, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.667147666754728, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7839884671376373, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059429717451, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916030635319, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.35936414616753976, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.531209349601562, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.31573597116784147, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7233094656333812, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745834018629589, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7341195285889428, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5698526488894754, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.618780409092974, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575346477809, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4148988560495028, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.29421496578967055, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.3157359792116064, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937169739225715, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233684616307274, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5389832065437004, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.42441199941384716, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.26435836110862504, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584174994519499, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891318026374, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8910549551289957, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8723473816342294, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6334102786569497, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339718987344, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178908042831, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5506073655246155, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6909762613840544, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7592254207425797, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907610624556505, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548781407482, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.12421301322629127, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.2309197500884793, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4130035611691611, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567993327179, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692552548459, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.818736802010509, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8766343715568382, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.7718435019813001, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8606036210093795, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544108357848, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6825737251085612, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.8116760154156917, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8267117976284761, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681151165616, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8832359929358325, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.47463117676874356, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6132365577131945, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.30239106670700183, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295594092613, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228646138765, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5640984826809635, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.690976273834233, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6001883572751917, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030761793775, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737516648154, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6740504841779049, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5869964389796094, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5602526537174918, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984936047497, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762878598354, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6531269151513256, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6334102545695832, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.43398146248822733, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315569311073, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.41679666821039774, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3812195581159754, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5660185381119156, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6001883464277883, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.2267836404237518, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356687212359815, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7248702782242609, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9124361558408185, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6943026669607087, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647131651398, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8774767814058998, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7057850307152709, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.31912140472031275, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6057990365866722, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085732618655, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.394200964721442, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4148988698063476, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358181772344, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.39233682432050204, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047865909944387, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315943254183298, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6926419790519637, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7718435153152717, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8428631404953106, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.697608916432877, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619304132409, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6876300042259081, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6020616165506334, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.699254429199505, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494631841885, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122942472969, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6132365486660235, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5621765049871014, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6531269384855148, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.39793839445070706, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.25982563448050633, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6297746040850101, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3886180310654031, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5448014060042883, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.548673502942664, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061481038903, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.6513548485524072, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5660185381119156, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.505859121305573, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.33111973385684745, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384065727894, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.8459424278263324, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7799929130042452, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.5467381607053607, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702707593415, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343740568247, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7170119221427255, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.712232175320131, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.759225407465538, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.779992902032121, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737267301629, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9196425344271791, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6169358137194568, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.8714748684335423, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185786708753, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437605616431, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.2814055974956792, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.21337716309198315, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.46295860359539515, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.40733340033989346, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.413003554862381, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.3738757928764049, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.3849121322935672, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6352224376897266, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033570477335, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591233996594, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7534666501972714, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5755880269342915, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6001883520324107, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984671558854, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300431358558, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.4436004185933552, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6039318419920576, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.48242909350301616, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834662645996, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.631594277097808, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.7057850279352862, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.7154239697407869, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.734119549576626, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059264902941, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936593160412, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5774953683705001, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.6406358459109633, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.4551986176995325, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.4960938329769206, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681772754855, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5253688156325529, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5467381474436291, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.6279512081086924, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352703249847, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668455849847913, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.5097644036527095, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.5467381693126706, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.29421495966028, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.252384048385103, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218814144996953, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_2_ft_llama", "target_model": "llama", "recognition_score": 0.9742394416736686, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_2_ft_llama", "target_model": "human", "recognition_score": 0.9572777990041151, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_2_ft_llama", "target_model": "claude", "recognition_score": 0.9732407153099019, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_2_ft_llama", "target_model": "gpt4", "recognition_score": 0.9563089363595498, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_2_ft_llama", "target_model": "gpt35", "recognition_score": 0.9907319871527921, "ground_truth": 0}]