[{"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6132365745166363, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6808786262005191, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5506073562336617, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.577495344909341, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253693359167, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6740504599309028, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.32423540507965826, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3208213069019304, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487214278093, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804347928033, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3504213739932541, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.49023561675195715, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4054487293444783, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002882299689685, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804653645944, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8577681074800405, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9241418170796608, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8816149123311464, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125582218261, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9511422229445461, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6076631699850407, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8633915960925614, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6859494615980101, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884628960735, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256495323243, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8354835389317883, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238815158344, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8365545676948161, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.715424002940337, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802722436803, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2133771718599202, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3363310344356684, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.22405546411188937, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015437088064, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.361164732180357, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8688267761728693, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7520125898770091, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.560252656051247, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228739019632, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666070558986, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8955226789428975, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7170118665140718, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.833324596296792, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833826360217, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9543079654432693, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5813031085289458, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7853085978521789, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7025300437685671, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834923503813, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011276997743, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48633153169604604, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.36116472337434774, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4687906164300422, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666003161102, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953773572491, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7866228341402923, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6113819687679762, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.779992905079811, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740145949704, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3738758396566441, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8244619257408548, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8856314716821456, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7931059669361615, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746003328216, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9381240154414485, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8418256481369246, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7690802483918452, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7892336864936829, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671456180856, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159497469146, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7563575682089956, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7217432321706182, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.782662483601188, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366586699969, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619289687077, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6859494525153399, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5851011650016351, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46295862434848073, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585483870358, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8300437701898921, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.85096471645699, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7813306359044301, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7826624762505857, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423290891938, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943910105663, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2845759952618285, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6774740015678464, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6352224282410748, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584174984618739, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4474602803175854, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5097643952330693, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.49609382631053794, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6113819749448782, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384227541123, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473326832813, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.674050468490734, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7446563473418103, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8397339760764142, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919944532412, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998574272382, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6224593286273714, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6774740159187954, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5926665959527403, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593418984108, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878400346904, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7476159374327954, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6279512268597506, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6460136887874464, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448014011643241, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759594937319, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5945512726894467, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.332852338161184, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5813030816258543, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365580839366, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365355877493, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.879146765679993, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9294404051004869, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.818736780664159, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772452057195, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274231887152, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8705972723297738, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8233284024759793, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8333246030963237, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149741250928, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762824488059, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3157359808710935, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5945512708907207, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4282333991996413, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8210440978895306, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358391421871, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7041601384338677, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5117165915219081, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6477982483429167, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9278877959091563, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291288601696, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.49804690138207935, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2628418597331023, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5851011647159401, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.23231014041537862, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234818454508, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7122321819671723, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5389832235892215, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033495160263, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723794606634, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684781562703, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7401743818189364, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8418256495751867, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5350984128764407, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085852732787, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358762843756, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9219218353419439, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9761291663722006, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9111797109955984, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9621075746601242, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9825575164501216, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3923368366108375, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39420093529363565, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2240554580456652, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010666953304644, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883440826667, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9942250701710067, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9948202866637477, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9862576791757195, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9880389007604727, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9895916864621266, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6495786340988908, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.876634386723724, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7866228276781838, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199271658963, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366099532585, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5214711599156071, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6261242102072524, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4436004389689966, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417200353045, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.47268347562291346, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6808786232497037, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4941409057512429, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43014734409984673, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185944055200486, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.592666606486486, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6224593244523347, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48242911579365727, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2877678082260125, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791901140249, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333766664668, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6671476615214668, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5448014090941934, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3575675217354522, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570647612580604, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300357324996306, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.31573598916277895, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3468730793183591, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30902371348435326, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4551986183178134, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897339551186, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4941409085674787, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6334102564401259, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.38676346348524265, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684781852535, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802615695811, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.31573597849306434, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3174262742646319, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3208213158079252, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262914459734, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.24653334503451593, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7217432320972128, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6976089094162179, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.663668966515422, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585820531831, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073902351609, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6757645827746397, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.651354877721462, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7905303369395441, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548996928606, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504702460222, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201714870515299, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6279512019820103, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6740504726713065, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241876722072, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004071694137, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8940517144663855, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9385759642275775, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9309620719103349, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8723473794050611, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9309620739067934, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3830641730934683, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.14318770477446074, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.16559311881558317, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40733341022685593, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048023322402226, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2043418987438866, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37022539257478093, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.149035293545836, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634245330227, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33285233536225406, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8031737892259216, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8019358219882388, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8044059269428973, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8529354716206395, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786977115034, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.90122741227119, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9273632931032612, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9167080735633939, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9230391597888924, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9704646623254425, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.46879061203795847, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5945512839724095, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.36296918561468017, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.22135069032241655, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38676345761685954, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.49414087856627215, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.409220782791498, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46101678235165977, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4416730283074569, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643922605439, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7549149962991373, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.72642560645391, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8879840607866258, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704558894715, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673174027077, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4339814561529715, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4339814493005788, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4687906272717818, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633104057130475, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4073334009474429, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6992544238559217, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185625062502, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5736784096559603, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7732163469604251, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643805110592, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7310585989811348, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.583203328980963, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7759445584485194, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723779656993, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666709876537, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7786493145645658, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2281565131643229, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4785288106592434, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297745850780921, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279511924030335, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7310585668973608, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.409220782791498, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3259495192352083, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116442838416, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398148475797216, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6926419890499071, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.49218811830133713, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7606506714475152, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019530884253471, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786147201628, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5428632727540396, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7371581598784961, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7943849594562237, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.723309471014942, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527667472277, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7154239900806608, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7577943824735034, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5136684715787759, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982267075212, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300452182317, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6460136982619624, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7662936533268996, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6825737276915728, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690890226465, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068908727, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5331543962044677, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.43398146686044425, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7057850223371728, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073346205861, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092207922389077, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9852713854998424, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9967269352800996, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9742394432470278, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9895109096561068, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9748211582103912, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8489722120898272, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8688267736168762, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8624675340253212, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336760972042, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8233283991136934, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6057990562707778, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38306414557170865, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.41869688261768073, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832211665248, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.373875795443572, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5370413773537432, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5563995680526185, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6636689720636999, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.737158152724748, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757645823427172, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7662936415493444, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7676898604765326, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8539127494381091, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.841825641665631, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936617139924, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2351083923461634, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.30902371243231797, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1778108783277699, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2658804644702213, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33111973618554874, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6706082821619856, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7853085801385213, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7534666619940512, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7839884735443526, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321806136081, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7041601482236175, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.850964710708195, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5621765333552504, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737086799983, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8519528176011816, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7217432028672958, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6926419838224098, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.863391608137535, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43206339197895294, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9453993968215384, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6315942954023099, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41111085504551437, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3539863074485404, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.44167302897340077, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367321655832, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7704647802509378, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8652240817201702, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9394706064620414, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8832359913502436, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.926303731083949, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8031738012062551, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8529354695293991, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9005297831741358, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976953024644945, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9462003592218118, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.372048793414223, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.721743193954257, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5117166166455468, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771135826669, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787062020732, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5755879995645048, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159523405714, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7786493006206746, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023562395844716, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239974513039, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7577943911910228, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8428631449717822, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9219218353216472, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170119012074041, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300391375514, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7310585599818197, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5156199121941889, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4941408873583273, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538610101176347, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793784049810677, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8175744827017833, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8568122982808082, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.901920683888443, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358312561256, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9136765215158662, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8489721882131103, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8732148227573775, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8164063677622704, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437717365045, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897226323058, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6057990511433712, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6808786251656701, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5583269836612562, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708858680919, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233682199620007, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5640984818723079, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.638835292130044, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6150878627651627, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7170118652558801, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197851360052, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5467381493124028, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.43014734451345216, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.581303100703759, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367171972519, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5331543904453163, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8469578448178838, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6513548592161564, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.622459353808961, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046973876201, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5983121931102104, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8732148204581744, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42823341662457154, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011363092027, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031738072604108, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5926665933863394, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8529354767055102, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.679178702295456, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015138890302, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578511784293, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3647775666215985, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5621765021517502, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6548947009864234, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4035668825033134, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784183445102, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6926419903305671, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7563575673268397, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6406358633629328, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389777971238, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118835680325, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2553436515824287, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.14223189172959766, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.10669059789189857, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2173375004496692, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2494472407927883, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7994423317975846, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7549149866799353, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7008947937422382, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631491951695, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.81523249276906, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3433417296190137, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38306415968395646, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5506073696965122, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3468731021242945, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2735743944428442, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5926666025307994, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159407027119, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7154239917595464, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585832887283, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.660172411581077, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.653126900306529, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.804405913601676, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7813306250449844, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34334173235678517, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919944269425, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.36840570373357734, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2751297247471131, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3191213979082949, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621765000139038, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132650976610506, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8031738025611074, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9219218395041432, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6976089090534131, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8459424337876357, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786519096036, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6242935176121462, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.46879062586260284, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5097644068035843, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015399642877, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964168575909, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6548947215385775, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7325918322391095, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7386690832359386, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.66017237181159, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175008171742, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.30074557215745, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2583259619152631, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.18010666499510944, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922078876030177, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.24077460188132999, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9219218383110274, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9594592589137997, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8175744650734004, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085820441299, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744769518741, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.300745588349463, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6566582586188764, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5813030941111035, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531348492711, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174942934929, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.276690531289142, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4416729911524745, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4378235200657578, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2107662853214373, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186969241841252, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5563995691144145, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6757646179334396, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4921881560218324, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106282865800784, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318327790586, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5832033596201345, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.44552954318585763, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6842640122219886, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.687629975438858, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030983737278, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9693241994659797, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8799743798777006, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9671630477005235, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8643104561197824, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299522473413, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7122321844052952, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5389831944658121, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.39981166395446005, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643649710815, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308033299911, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8198933566973661, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8705972658930871, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7956581075495942, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568122950512473, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163549507256, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9073122205581731, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8006920244028439, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.853912750896329, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8714748568609676, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358204864763, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2893716832634551, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39420094360807595, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2991051908326466, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370414119512639, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48047865588755534, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4843800674332377, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3174262577280278, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.36296921576354746, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.30569732130659305, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33633104424767396, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8044059116596822, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4035668760117405, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.27982849272546095, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417502587753, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.36296918005844475, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.949669367739723, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9666631761573439, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9569571476848784, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9309620730394452, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9734434287186586, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6876299962111029, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6636689430121515, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3415824998503128, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381397424821, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708833719489, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43398148344353965, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6406358635594286, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.668880266542681, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761270140392, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.56793661358456, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5679365974654432, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6261241784459234, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7154240146139917, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191303584088, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673176136455, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.32252601655798774, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.23091975034897885, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5234203512201959, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.18242552984796798, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.20434190319906065, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9235923123124956, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9600626830837977, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.899827778094973, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8187368004479547, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9161096149658543, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9609517003369914, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9412234383401651, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9376689588751601, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256411361881, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9477691428178008, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.17553805469365721, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3629691905877181, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.22678362311048894, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3720487965438216, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.25683199497687104, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6442251188859281, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6388352806597956, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8539127504144423, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947205497592, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.47657965783604456, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8679338555459964, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8783142367065457, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8947894649558743, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578421023062, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943736446346, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6388352714843251, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48242911579365727, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4339814765884021, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791901140249, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.29910520265943874, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9086178971766206, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8918110405454679, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8175744723919971, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624874225087, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122973164929, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6095241753301691, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6825737124372551, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6315942735218814, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6020615839734742, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.79182105684487, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5544704627022632, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6495786405273745, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7620701131590746, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581817143021, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489722081264451, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.27357438601575357, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.267408153370628, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.11124121781086528, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.18832398858452615, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.17106118846857551, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.749087223665121, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.726425588478979, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7634837615235852, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436004234452322, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8670357610196486, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7154239931627816, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5563995759892876, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6132365728192111, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431679928669268, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191496970327, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7122321808360416, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7892336969257395, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8766343844317149, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269056124956, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735122171454, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7620700990872011, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6460136865924666, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7476159508257143, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423155313708, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.53704139722242, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9124361711063547, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8848377746981633, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8489721967022351, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.861538212063874, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8732148255882545, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5448014154998183, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6619228546556896, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6774740186071081, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690725507146, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7248702700347492, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3647775624675218, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185187232718, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9032942051073178, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4320633988225809, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4746311840995112, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9640516781138376, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9795114457534212, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9334308141148189, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9759464458213959, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916031839566, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9824231153138276, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9453993933748087, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9372107948527008, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9807288634219208, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206866648315, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4902356225609559, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5640984815187007, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6584175074209012, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.455198603836776, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.687629977340173, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8233283805759434, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4148988525527667, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6261241719329136, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033379030261, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527787705903, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5486734776236627, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238790656415, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5078118614940961, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416431542544, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.409220783758831, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6442251258081404, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159523405714, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5525397043032184, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023562395844716, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239974513039, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.63703080439373, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6601723717981355, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6825737499460298, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8044059205178566, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740038454387, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5621765074427202, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4921881217781551, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5983122079116874, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331314936907, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331698119502, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9105454002324006, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.869714582213606, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8848377672239082, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744913225143, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085803335347, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4054487296545491, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41869693308596323, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49218812315691285, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522017647089221, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643723677399, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9213576216967583, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9740426415344171, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9804313242163077, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755694444055, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9026096010668339, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6334103003227312, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8606036173038393, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8019358059358059, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268347614458633, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9207896759967553, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6406358723966388, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.35577487611293246, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4073334017365751, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2925953095647766, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3433417380649554, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7310585631169189, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.36840570503631165, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5583269869097146, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46295861768504826, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.656658281524649, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6619228938141881, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6261241611688498, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8116760288548974, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619241492382, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238644758789, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7759445543651743, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7534666804914206, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6513548696994874, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891282549697, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891218855381, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43974732800382604, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5214711801936804, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5736784050530008, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165124868231, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39047584448803335, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9420819110644189, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6654105611441459, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5983122069335064, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850247108691, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6619228806624887, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7461390082304741, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6460136970180096, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.455198576395468, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787227336608, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601591777694, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.23792990545831572, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4551986234242476, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4571367399046546, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.16885694778464008, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594950966147196, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.579400446149507, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.583203328980963, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8376199720982436, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723779656993, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.715423986932157, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7341195202069041, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6992544387414052, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7759445324366282, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197778355704, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358659081979, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5794003897866733, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7943849440192595, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.775944539820989, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111086463947816, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666067638846, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9268352812220904, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8774767895702953, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7892337116376843, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759836722094, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8991213807177252, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6315942965813615, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5058591475849525, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6859494448201473, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073800068229, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601215920076, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.23792989735683182, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2751297169037824, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4320633954579847, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077458893325948, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45326185616419057, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7122321899176116, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6132365602404515, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4746311778093789, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381583793921, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476673802985, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9385759589688986, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9136765306102229, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9219218333126916, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517115082286, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9019206684439998, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6893056233248699, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7577943824735034, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40733342207892903, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191229398766, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046029280549, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201715045491702, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38861802047614635, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4416730231483707, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061594688894, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368242275857, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4359015373849089, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45907614435826166, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43014734810471716, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37387582466512764, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493079299445, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3451052802055259, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4416729924147392, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.432063392426784, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224603206784, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318345984224, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6548947352341451, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7826624802854039, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5794003842235628, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819772153543, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366119511566, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.295839855514631, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.585101160947332, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3468730661062416, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808732642252, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541660220132442, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.40544875011839515, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5794004009818434, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4629586124909237, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800805681707, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.28776781904166737, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872106553709, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4707366033483467, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6926419956072433, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.540923863261799, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.46295860944442635, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8577681031603642, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9515039946966738, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9462003550503473, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9019206733490044, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299527773189, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.49218810878649283, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6842640161606112, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46684559784921087, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34158250986595784, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982151757637, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8670357612179653, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9278877965472625, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8998277822677984, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9445872056073805, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9319595868038177, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9788748057903072, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9190632872279605, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9252299528835608, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9449947132047262, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9449947191282605, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5136684485641237, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.441673022788194, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3345894455607338, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.598312203329809, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.34334172755793574, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5679365951917357, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7826624895233378, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6095241592583639, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352785881074, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241652591261, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8210440955485545, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.752012590682584, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8019358282733678, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142486803788, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9073122190397104, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7718434941890595, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8479677621273322, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.882427862872195, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772349581982, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9026096030926882, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6723316976492321, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5698526262532739, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6150878692083368, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8092759720071468, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704478056997, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5350984159861507, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.49023561630144896, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4668456033220036, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46879063298692103, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717665999711445, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5350984205639402, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6020615850086726, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8221891245504729, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943225986472, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525396896996262, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5583269886423448, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5253688252916116, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.596433116833408, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47073660498557796, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389844516577, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6636689624901598, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4668456174871059, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4513265267032203, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922078250161564, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.61323656610961, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.45907612229614286, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3611647166513807, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6297746054672354, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.27825680898139066, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213345644968, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011431044209, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6671476864801171, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6566582588803962, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254056382614, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8267117942181442, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4397473475065745, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185329285665, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5794004123520758, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254199399597, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432006689944, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.583203336130392, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6791786826170875, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4301473341028354, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358114710042, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118704286705, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8519528010463977, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6723316956745639, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5640984770685571, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325218492801, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804420574574, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5774953748271929, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38121957635469633, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6876299925987879, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998682772688, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.70740469765363, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.39047584639028354, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4035668635500811, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5039061636634911, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531136387372, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615722668535, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5273165294773754, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7008948058563579, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8807970788879201, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762829476613, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.700894820169963, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8955226797207386, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7994423163355739, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9099069991789898, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283916123755, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.874077227627281, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.355774863943437, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6859494461202711, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5794004034430662, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366029784172, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819695310266, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7310586012231631, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6352224310934648, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7138307306849813, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570649049374705, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684826773592, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6943026661166557, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6992543997565627, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7577943476714877, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631572572553, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197903686901, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7170118731184021, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6279512144598696, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8044059245557884, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224435177796, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.618780421769891, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8187367968487782, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7786493034139891, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7853085824706972, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358294384218, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715009814511, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8459424369069356, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6976089201415189, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9032942080367806, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8233283954469365, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388145620047, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.909264502201397, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7446563605080889, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8740772355176505, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942311903396, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324784769667, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.738669058866673, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7799929071875586, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8006919845335475, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916100527353, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180276403693, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5736784005759926, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6206216016501866, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.29583987058108807, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.562176493311061, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939172255283306, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8449215167273113, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.925229947724176, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7662936538741153, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923214733671, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.874934618949567, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5679365993948039, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.279828487186215, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4707366055713025, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123699839895782, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37570647569678284, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9372107952767732, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8918110526506178, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7106283046632073, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9190632916191439, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754477431731, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9079671373585794, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8816149046320148, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8918110449069644, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9489172634031904, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631639210077, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4455295232592027, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5019531162306203, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.38121957338355716, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.556399584146005, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5945512601964976, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6976089223246726, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6370307902559043, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575683449234, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461390287430428, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4765796428308618, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.29910517849886786, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.346873080738063, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688173116673, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730797525608, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5660185405429731, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.29910518818289655, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6926419781959556, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256614443178, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378235099887696, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7981867767679571, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7759445638924684, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5621764971175199, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916159509636, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197852297819, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9635062332179549, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9235923170743033, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9167080758429451, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970722749761, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.935346510122874, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7981867750544933, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.843895095108932, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5755880007768786, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4225046346014893, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8643104480635305, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.37387582721417645, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5175709222172236, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.494140886695887, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689404706043302, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4035668491783084, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5214711456760172, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37022537667227434, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43398146514507335, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541660859571172, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845760074170318, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7759445510326205, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5813030963188905, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7490872391478748, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704648022972274, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8322366535539141, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.74908721900282, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8428631435646745, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8187367883618296, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527753092567, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825908249751, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4320633842204837, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6424324649332347, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.462958611736599, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358120623523, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984335698573, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.583203344155284, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8354835459111226, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4263215784305311, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413857943509, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068834567199, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5983121794135073, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3539863165334, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46879062074559574, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647297638214, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.603931822747902, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9046505398285037, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.805632208373967, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8697145859004268, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8848377803533146, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8688267856051877, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2704802232747287, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3468731039275479, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.32423539708518184, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1530421502977583, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33633103590543817, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5660185288401237, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7264256126891484, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7248702811020649, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666510015627, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118967334692, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.575588030761553, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7041601490262702, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3775406626133313, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525397269303794, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132648286734545, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8354835546051848, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7520125609867765, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7505527512787306, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7981867739548888, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056389554008, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5698526356542226, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6132365608670335, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5097643721464018, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40356686865381214, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708628082223, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.600188346032519, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4941408948601245, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5039061528727147, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.501953117259765, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104788965616392, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5983122132639174, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4397473658432002, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1520322450391203, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306418785608215, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094695244792, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6959583281925157, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3702253827948371, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5175708997235414, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761395258393, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367311967421, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.27202457088950055, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.21469141252356044, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.16026603653908073, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633104807675057, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.322525984689301, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5448013932321152, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5097643827566808, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.21733752584949073, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3328523245040571, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030810332556, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.709019140866907, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7325918434665694, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033700693122, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.661922884015604, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762996959983, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4513265032369877, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5964331673042779, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5813030694777312, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166099616982, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526728146988, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7505527635835956, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6206215980007914, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6224593203162865, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268347734498756, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544255230385, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8661325235930586, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9079671385795508, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7461389639490711, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.815232489098791, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.808067211914349, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.74167400509452, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.660172388021811, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7905303123780401, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872098707169, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869689647278074, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3867634607524025, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2991051985316168, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7264256076021168, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833994198826, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170119011869469, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.36296918771986353, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22405547001311385, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2081789220819485, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687308008234985, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38491214154335396, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7431680038427304, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6808786103666209, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6442251172883741, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6619228483894882, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891265102077, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.602061572391273, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6113819687679762, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8344068769844593, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432086477847, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3629692042518293, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48438007641994263, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159482609932, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6757645847601309, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7786493079690601, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365553669602, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7943849640940069, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8068526269054861, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7248702555448534, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277839334416, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175158230553, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9167080687969191, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.896251371776308, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.948537236505957, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9219218388252969, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9515039931246855, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4707365793200244, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.548673508402936, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42441198043539485, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984740472856, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094587968342, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8596637505133342, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7461389889163106, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5506073656923407, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702833622941, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884474652451, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6791787024891143, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38306414557170865, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5428632668801541, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6113819542865527, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544073799269, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6825737145140067, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.44939263260002593, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43782349979969437, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199378392373, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995836173324, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5428632694947108, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4921881356773925, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3328523247219736, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37387581320162855, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073580159205212, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6095241514653554, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4921881346455882, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.32252599481182165, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852885429973996, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754067599247343, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.781330623840079, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4824290870749711, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7662936539493875, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.735641639117099, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163708106945, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6566582656930954, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3775406782847848, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5640984861319724, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445323122002, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545627497325, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.743168021759562, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5058591237821662, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7341195409512778, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085728581198, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802431308524, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8407825856281247, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8887587840994499, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8068526165592343, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215266260459, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336970497071, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5679366119619335, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7371581734467794, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6976089293656295, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947078619314, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.825589721063555, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6095241594325367, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4320633705080364, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300403913275, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2628418568532812, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8766343822070188, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6671476717759609, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217432160777176, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191248280002, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240683443859, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5888891263970755, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5448013961095602, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6261241746191611, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468884061923, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746313575444, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8175744749693502, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.46101679817497426, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6584174918008989, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.32594948867824, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.644225105347179, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6859494400109108, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41300354732449546, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5370413738922263, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804641233619, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7461389836980646, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5467381564135536, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4960938197968829, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.41679663684790724, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519859367147186, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315942895534058, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43974733939988064, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6706082800831242, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4263215877913855, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743711298309, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953636200395, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5156198890310836, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5945512405949855, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3522017914436642, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.432063400406166, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585729631451, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2798284903666232, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3757064595927649, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2583260010742531, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3328523410345304, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405546872988194, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.214691410107477, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.18952109656646762, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2991051864493091, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269114574337, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38676344452234185, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4148988436885484, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185187232718, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4397473396451625, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.388618031794342, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643843554617, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7662936619119944, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8766343836911814, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8428631338180409, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.624293512585638, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.830043777911117, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.19559408594129707, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.20946970275999463, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2893717156147942, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632156271632143, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38861800734423363, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7634837736361175, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.583203332564131, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8152325083806298, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689450427855, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715102507655, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9196425316784763, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8187367940938823, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6757646147251806, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673189433635, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9532750435205024, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7662936621931393, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6706082752631662, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8397339652524388, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581168807029, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673308647597, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.23231015615783215, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45326186712639693, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2877678126374729, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2974699569339525, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720488002600912, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.577495366924989, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.49414088638931697, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6976089180527991, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640381885138, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058591055448642, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.34864513861675667, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5525396948883037, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6095241691895374, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669053084934686, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1510278107231112, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5117166205815965, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4687906254949931, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.35577488724753253, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47657966312310646, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743674815535, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6757646153809799, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4455295344278487, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6297746077464972, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487265570751, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358278533764, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47463118760137807, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.36116471617864876, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.586996414978652, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.577495372975895, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224218802677, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.30569732398083077, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3867634531711502, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4054487416792976, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.19072402269540714, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.556399625390586, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7969253711350273, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.858718588651624, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8757869903944173, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505391418957, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916206251428, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6039318334452054, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45326185709455835, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42632159331057345, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1835936229877991, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.29746992482280393, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5736784124171002, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7356416373036572, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46490155325653937, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880140084108, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998492420112, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6943026665820472, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5926666078287685, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5156199182242434, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624950868557, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125641940877, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8864204052080729, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8799743747464944, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.927887792566746, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8479677707580333, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127586617865, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7534666609893764, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.695958323547705, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4610167882857992, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640125530752, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689519697907, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5698526532394723, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6688802676791602, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6566582667824464, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241808068537, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783786441116, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4416729956709778, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3849121487416647, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2598256511395972, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181322975039503, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237055641888, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9656413113515174, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9750122055200635, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9485372392089825, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9700134929711037, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9575961730622465, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5039061694788307, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6206216154097025, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.29910520735316165, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016877911392617, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121956737830515, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.638835285663662, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6757645865157665, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5794004237062877, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224444772816, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105490187038, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.31405056503707773, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.36116472155403156, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3023910752735876, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295184119201, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469142405949926, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548643263073, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8449215327752232, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.35577488764471044, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8548846378526547, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.877476782565147, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7969253772390542, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.735641642063048, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6976089284012039, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743574160585, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.47657964022058485, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.717011873878083, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7431680315501972, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.38861803502117676, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216216486935, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40168779937106747, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8092759705714568, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48047867771096403, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.64601369675077, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093780918574, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689496110011, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7931059581792524, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6706082937876648, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8596637506390626, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633151892273635, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708786385843, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5907792011528828, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6334102429475109, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7563575348133843, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833840245077, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104788964342506, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7648915938840307, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195310990939, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6460137010208907, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324639427768, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082811677208, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7401743627477199, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7956580923555483, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6169358621627972, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256156856636, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254088617723, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8175744719806183, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8080672164182439, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5409238501010389, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7892336976439293, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.926835281552462, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8210440988140622, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6513548372880459, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7325918370639015, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312037486857, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8633916069379733, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4301473286583073, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4882834120636394, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5467381233564558, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261241779334279, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796447372208, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5409238736713875, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5755879970041249, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7233094788678797, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754442713556, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105750752544, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.41869692656079666, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.35936414046129117, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.22541660100884595, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2081789340809115, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559408510423484, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7264255973425888, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8624675427035604, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7839884582075811, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.647798222620945, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884698546877, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6671476779252802, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7505527404797585, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5039061450424933, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203300430326, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737899382497, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5292634023270768, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7025300453922938, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6584174800851778, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678185887143, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.762070124122905, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3468731158854337, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.32594951485040125, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.54673813102035, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.26435835568584154, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398623795489, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8386797655418242, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7662936433486021, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8311430409292042, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089017401983, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581680786727, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5292633800757842, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6020615866832473, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.744656355406196, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228168562382, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.809275970105517, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2829881238714812, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4590761195024116, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5389832181228754, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.305697314804617, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633874573563, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5428632645766628, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39420094362373115, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3575675222234779, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004005156933, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3702253888743948, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4941408933188503, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5117166148355901, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2613309154687675, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.25683198633445986, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.28140561259568414, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7025300393728888, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7074046854969743, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5888891439142436, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8198933291998596, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321833592489, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7879311980894154, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7025300499794952, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217432018782547, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8757869840855013, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.837619972536581, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5640984838058537, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5331543804011604, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6791786937627442, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504809399914, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.809275983977191, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4863315283795579, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5019531225121454, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5755880263899953, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834852765407, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165412875765, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.38121956977422616, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5253688061789674, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5525396964908964, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734859538226, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804294510165, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8128673104205942, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6406358367116374, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8386797714724671, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723316674281867, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495785967407404, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.98840263834386, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9920620061229275, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9839708527427363, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9887554392064201, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9780517449768033, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.23792990306360215, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.31069438993918247, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.21866936237245863, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315357544608, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.15002882292513406, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5869964353931464, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9142907309022114, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.705785041121678, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584175182205001, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802296363758, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8428631422996619, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7690802555803669, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9190632882117671, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136945929406, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094795232791, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5097643645420977, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6513548446306512, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.472683474745208, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943823146562, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.538983211850155, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6206216039073447, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.31069438095311064, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.37754065650535706, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204877770780725, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318424492419, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.30735801394241086, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.44939263945798275, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30902371702599474, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.32423539843886645, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186969144349432, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6909762990069569, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9142907309022114, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8519527988964054, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.647798204108156, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837628674703, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7759445610736073, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8688267648953368, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6636689668159663, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253749523529, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467787063121, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8116760210909197, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7461389889163106, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7356416387969833, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195287426873, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672059106405, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.29421497094192, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.46879060688871255, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2043419043779301, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.25091279999419275, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681576331574, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6424324795973407, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5888891261850945, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8407825945002452, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300490720859, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331543809772217, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6808786181781034, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37754066059126395, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5869964245048561, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47657965488753185, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548514231979, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5019531149297211, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45713669073208263, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5312093609255683, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384225837819, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358602483854, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6169358103653944, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.20181321932133606, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3090237147680166, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061697892853, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2407745975982847, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.773216380220609, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7356416304294408, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5175709005897984, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711911564595, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8080672109337135, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7341194983300704, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8732148414288221, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8732148269092734, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919936646634, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430380695111, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8459424333548852, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8233283970605567, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6315943185266218, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513803531725, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8469578290422798, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6370308122052107, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6424324771787395, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6150878821713824, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512278912715, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331692833477, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6169358179752997, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7170118796693591, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.403566885229667, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804686616341176, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548463399008, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6424324698149241, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7676898511407856, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5409238672177455, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620701046766419, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948137715424, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872081275268, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5640984997320283, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5679366074081922, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197799336656, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382062296476, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5583269687495395, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6424324795820979, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46295860856750665, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241678548406, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730241618924, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.575588004089058, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4301473234664629, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.48828340385031893, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203439133752, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074558898951975, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3575675260883472, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22000709539541324, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44167301586330204, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40733339271728136, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.42441200869121676, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.18242552498937742, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.30569733780259384, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2160115258604088, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596071624826082, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.06656919053714874, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3757064784130739, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.19806418545695173, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.27357438629764463, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539862956088522, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2613309342816263, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5640984643769671, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8019358172354989, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.586996443370941, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195373764441, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.858718575745786, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9367494759945436, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8558511447170886, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8221891277290958, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509647031780233, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9403530581154322, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9324533070083972, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8499711796703757, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9099070001269378, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.914290722548317, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9207896838614504, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8606036114937362, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.667147672916876, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.607663162196705, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7759445478381254, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.891811037869169, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6424324691278188, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5907791986366269, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033627056262, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632158049666574, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690755574088, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702597592218, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37204877185021534, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8104789200121819, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918380770855, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45519861477420087, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8044059127518915, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8529354695293991, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8068526350783609, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8688267772784556, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8092759433025755, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4493926395417781, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6654105664267359, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6601723463956584, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.13117322642585275, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883656138609, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8774767917803524, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8577681100607352, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7813306168610304, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802757401253, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743603977857, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6723317038762961, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195223174546, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8044059059264123, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.705785041381547, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673144559264, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8311430385816124, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.702530053718198, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9353465070813752, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666682210476, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.815232501807048, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43974733605263217, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.515619897729626, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5907791852249337, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.60766316379692, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964264774205, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5736784167697122, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5448013961095602, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3867634295390816, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601269929254, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089168037227, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7759445490421268, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8519528096600613, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.793105941482577, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195283808419, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127516193539, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8116760113403045, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6187804570395289, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6757645982769426, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689559049473, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512768960171, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8679338522851512, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8019358221267756, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8688267829273967, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894656362796, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9039745131920811, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43398146967807494, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6113819934583992, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6477982228356232, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324714822428, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740189921241, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9324533031088936, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9309620679485517, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7248702868830182, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9549844666109646, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9219218347591162, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8783142481463267, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8633916223079479, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8558511573455292, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306201055562, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.841825650476079, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6531269367091037, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5964331307015119, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5428633094784974, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430543832413, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191427730798, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5117166005760773, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39233682897317784, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4054487264234292, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432161268361, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121770374736, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.49414092714837354, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6315942856287569, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.30735804243353393, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990682835246, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082951982293, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6671476662923149, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8080672257126744, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6636689551060541, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435133505692, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9425067189844721, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872099017032, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6723316887981391, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6370308028142657, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786102345535, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073564411622, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4863315253081229, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.242205635142719, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7090191291095157, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.32594952887447454, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121957365966586, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2643583793368252, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.42059960674178287, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.20561505514762538, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41869691705123935, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3056973311078881, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43398145737776916, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5097643810985537, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.37754067956031795, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253780291109, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306290349825, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.889528860623608, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8354835383807656, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8140527962034838, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8856314730944935, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.91964253203428, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44939263796604456, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.309023705587114, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5117166230563746, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.631594302259053, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206339441601804, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8587185922748047, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8587185816365914, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9329437116547126, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9343951640916706, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8887588048979865, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5253688042900085, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3174262801093454, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42441198337479147, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570647110238004, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3259495348363005, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7918210645406987, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45713672638096414, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4167966384446125, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116556792084, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39047583405192837, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6943026692082145, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6842640243838125, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7025300450938046, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127549822617, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512346316768, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9235923229475249, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9136765234750797, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.886420409793711, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8872046018079335, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.970464663871787, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7606506794429945, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7690802421382764, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6859494522244662, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.832236648340812, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878702912157, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8774767879910583, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.770464801947093, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8848377677737421, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9353465161652086, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9569571488842766, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6531269072126149, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8140528158102677, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8210441072783882, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9178933658227875, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8947894644707645, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7461389801952396, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5964331368447162, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6001883463244917, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526400904104, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494414044659, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.37570647723683764, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47073660695983477, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3433417426603421, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983121865633163, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48438008060376325, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44552952846255695, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45326183694422967, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5389831887204274, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.343341742299321, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882834125032282, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5660185262689945, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48633154981894233, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6842640195997124, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.586996425666591, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256167340227, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8740772294458947, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9149009595268548, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9403530598762151, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303126839992, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916128233734, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548604169115, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5851011770892783, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6477982369649892, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680065685525, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631923934169, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5331543892907895, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5175708910113322, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.47268348040342917, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631570415175, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878568446131, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5312093865867854, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6825737192164316, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4571367384569726, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878359036638, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.715423991033294, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7648916104045443, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5907792019841146, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6442251249784048, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878615769776, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317042069169, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47852884818853414, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.635222421173598, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5813030805134002, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468711467628, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794004124285532, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2766905221032588, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.19436780449922775, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.22815649511162536, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34510526988259094, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990406137836, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6671476647756649, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8365545607711351, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5983121983106022, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792310584621, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.892562536139071, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8558511508830996, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8596637535382018, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8807970822294442, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.845942439402025, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527963433875, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9674102564012198, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9848109511156911, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9833429602474995, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9916195461299505, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9768465913126274, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4111108757286012, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5621765021517502, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5602526731262679, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203409982656, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734777034553, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7969253519423377, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.720171507666198, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5774953540504553, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8311430428948445, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680203355159, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6388352683396278, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4960938253255362, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.19436781411024867, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872036446853, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7170118751571496, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6566582949579509, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5813030745622348, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7233094708718522, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136959166, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786208477686, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.689305601956723, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7772998583027725, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6460136937305593, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264255956411007, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743481663071, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.49414089980832254, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.43014735629622763, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5078118783688306, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633920867826, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.571766612054933, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5640984795793246, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4513265030935632, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4843800871800517, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.38676343076650505, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213210810646, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6057990550340205, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5964331512112366, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.443600446902614, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947383142708, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125668437199, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5058590971698624, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5253688194792022, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3468730768153711, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.29910518525444013, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.49609384010608326, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9591542856769552, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8509646977535612, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7826624775896182, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9339146238167351, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321974718507, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7799929085943565, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6619228932686648, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8198933473136306, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7956581114101369, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898675930932, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7461389792057903, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.656658266221647, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.697608922673096, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325209277095, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544278026432, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9536217946940887, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.925229953544123, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9416541586453563, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511578314587, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9142907209406542, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6442251233605117, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5832033523191588, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5926665931921807, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.592666610249604, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41489882886058665, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.405448727724419, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4054487192041943, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46490154961625757, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.649578627717296, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.462958608662924, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6388352836489458, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5583269671595522, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45519860483599134, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416393693812, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512825644437, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6206216214423493, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5389832030402746, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.658417493451979, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2568319920076796, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026998360119, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6406358618393545, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.626124179922225, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6442251229183419, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5774953906961926, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.598312204957195, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.36296920679978556, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.740174370917953, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.48438007296197455, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641440741693, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431679904723355, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.931462508052674, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.815232483377015, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8615382145654309, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976953001119267, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215321942762, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5869964198610851, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4687906203119868, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4416729991195638, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.44167303460784224, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545599089927, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.615087856112391, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5926666083403239, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5640985115072537, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.32766829679475257, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3539862883920904, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9026096026245246, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9284088036797966, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9666631746062048, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9235923096574123, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9086178977774932, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.27669052885941764, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4301473234664629, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6584174915830482, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796474317607, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4016878080894879, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8479677498736047, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7233094739725323, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7606506333255278, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358323066277, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9167080812561668, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8128673121612447, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8459424304314735, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7662936410723461, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578524541819, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346078577044, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6566582598429573, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6706082814325649, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7416740225103226, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159529455684, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582716423419, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.556399576046834, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5019531348167023, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.556399587340636, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46684561216388126, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367167591725, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4960938592669087, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7786493151274521, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.590779206760749, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743525967913, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033469245156, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5964331278537414, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8499711723686444, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8428631493893947, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737940644627, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506629515307, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7025300707534469, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6334102599548288, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7648916148231062, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.590779223181798, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711777290915, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7520125644674265, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5945512326020107, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7248702847558834, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832135542921, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300578093103, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5869964264919552, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5370413979845495, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4378234985896796, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740446118793, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544021264365, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5019531254635394, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.42441201898752434, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40356688308970773, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33285234118745566, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796418571847, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5945512451395273, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6424324960113967, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7185943918749129, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585846601246, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947332807916, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3468730941804788, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5698526581849872, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5679366067638318, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185235949059, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804688474775183, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3259495282469524, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38676343234744714, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.618780433839114, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494408717357, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.486331524567869, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4785288235796346, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5175708827051967, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5907791962066492, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46879062304807134, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601213889838, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7279754382915682, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8824278734955043, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7233094499804478, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.732591833574795, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575493585192, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011588477923, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5774953712335246, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5660185288663524, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504766734303, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995676662319, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7476159682058048, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8962513680793904, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.799442311334366, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.80563219574618, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545537733104, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.885631476408318, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7057850339725865, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8344068806960132, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760169123507, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8955226859984238, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7446563438887158, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7461390018338184, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7325918333936678, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118686957592, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789074313459, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6352224375163169, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7520125599208893, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6388352777747637, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358249584585, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416428795153, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6113819715167723, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5832033505030294, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6224593270639837, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916208797436, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631629040179, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.46490157124217635, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37387581189188157, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.15921741008414622, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559407121354858, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.22815649575822125, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6548947388810276, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7956580972342081, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6113819565888283, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802411809811, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506692036441, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3363310324564509, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4474602634532362, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3757064559100789, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658974587059356, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544874436131334, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5370413811138167, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3140505567494199, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.39606816827650193, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118590586469, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011202407332, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7356416570628048, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7386691044856314, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7662936490249271, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673019002933, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7879312073092508, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8233284190676682, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7057850339725865, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7648916163343552, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318271283661, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575491727073, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8233283926145841, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41300354732449546, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45132651906772614, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023562851652214, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8499711778499821, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9704646635906822, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9511422198845937, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.962673111808647, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9591542845523577, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9623913639236574, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7931059617747267, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8267117946105932, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.889528851781483, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8998277754890444, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9178933682734958, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6740504687928008, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40922079379677917, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.721743202779477, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512796925021, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073526794703, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8902942230183774, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9319595831418811, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8688267728634425, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9353465144538481, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346169180542, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8774767835686087, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9799765561323267, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.930458257806077, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9653811582058471, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9319595813085829, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4649015539651695, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.35756752949858206, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.34864512669380465, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.312370010145675, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733341134190193, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7759445500616783, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47852882684106196, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5621765056872038, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7648916089271041, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7279754554282516, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8577681067658188, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7057850362519893, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8300437629271293, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256430884402, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624875346807, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.37204879371285654, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.21601153207237694, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.19436782668059208, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2861692550069042, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1510278082289862, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.726425605100585, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7676898498554122, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3276683036690099, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744709696627, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.743167997931486, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.42059957765833106, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.544801381951984, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3684057102545348, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46684559392695235, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796611809923, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7090191224141783, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8887587953306102, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7879311926443687, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156198996309259, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943773325791, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.39420093250933613, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48242913776665935, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4629585972595569, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881615547386, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573595647921443, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4785288295684704, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47463120755747196, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.453261841289774, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419831207627, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455827580389, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5370413801510283, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.35936415076536515, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.622459328990589, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224235461192, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397028757583, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.474631164391314, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4073334101640819, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.14804718551328344, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508501130743962, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413884195696, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8322366533243882, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5019530920789922, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8459424323247067, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8670357617123439, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303104624147, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6566582762475117, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195296815709, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43014734557702583, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575587561047, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581493613223, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872044101987, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6424324665802237, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7138307421238683, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792326815542, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918465514049, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3593641349571789, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.42632160031471, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6388352952878791, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315450198507, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121957252929883, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548620489009, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2766905330078096, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.20689406168879806, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195737969591, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734742068975, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.45326185392996143, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.20817892404707297, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3647775647518042, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713671660908206, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45713671840212466, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5253688344253471, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5813030738073619, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6636689445307684, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154240007868755, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167301459055464, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3960681553591007, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4244119970670773, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.28616922125418737, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948111762835, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.45326186543387365, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8140528073522618, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6020615745001109, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.47073659737907153, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191383020997, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882833998699457, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548429219652, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7264256124366953, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6279512056912848, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527846236625, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.746138991619623, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6224593249875267, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6352224052473306, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5755880418461177, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358273664605, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292634042472556, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702805077533, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195218072886, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6740504618913945, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254123693191, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5888891399476165, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4339814780640991, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7386690872811379, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7264256141233287, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033662030538, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106283049589431, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2814056140697072, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6095241735901623, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49218812417305924, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3468730859481264, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4282333877065829, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7041601610647701, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8529354800388905, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5117166046256179, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.675764615385452, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.86246753383548, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.11436852172971447, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.42250462600409433, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.0900929973478963, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.10594827417726348, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846179536731448, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7090191349534783, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.35756751099338435, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033466139939, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746029717860275, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.588889139299566, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.723309471925359, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4205995739775474, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5813030642386603, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666024294498, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197838569664, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.41869690128926323, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5331544102095562, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5019531300024844, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384146589568, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244119675370725, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3593641149475087, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4474602634532362, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.25534366402056136, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.27982850949814786, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118759658273, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8832359882488184, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9358173515507215, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9314625135014011, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760162602442, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9429286065442332, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4054487306199596, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6495786316247442, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7718435072856812, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883337509922, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740044053108, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5409238607982689, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.588889135013503, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7786493169093331, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.720171488279064, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647848744285, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4687906303536466, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5698526516482126, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3923368115426079, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41300357662711334, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4474603073587872, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9755769091025106, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9706877688189922, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9678992918446293, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9856076628244781, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9651191124058088, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7981867782742841, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5019531323674767, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7008947828914971, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303174749289, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758357811495, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9717790112333494, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9539660995108762, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9877587236644308, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9416541636024722, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9458012719097244, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7446563545226835, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7401743632339316, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6992544145591572, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.782662478971903, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118687726904, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.743168009364938, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195172482812, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6976089079084746, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.48438010184861857, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241637809596, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5117165907554818, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41869690431986883, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3793783757162048, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.30735800426671467, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688125330003, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4436004318688319, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.38306418103316126, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.332852336129636, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584174950144644, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799929180317754, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8187367871145215, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8887587956741276, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9184802492998342, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.789233684453488, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.905322302572196, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4941409003936922, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.35756751099338435, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5621765003051749, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123700033885682, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.588889139299566, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.573678401993508, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7386690758967656, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5888891349720178, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122207714086, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165274771224, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.844921535113944, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8832359864034227, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6020615912501002, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8947894701679961, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105481142528, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.35042137237583343, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3793783909144986, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.343341737238028, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593210825099, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688230712241, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8774767812895303, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8732148248162592, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8198933421193267, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416211929834, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933286956736, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9863631638101732, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9688561658728663, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9813106912841199, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9879462210202807, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9678992930369795, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4474602993074256, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6654105624808027, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.624293508618663, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082846970454, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746264765909, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.39981166111289157, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5428632749492357, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3468730686276519, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641292866061, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.540923845969784, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5136684580777262, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9334308128329744, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7386690790932532, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786958647704, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8723473778602974, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4205995950818637, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5869964341132249, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5136684715614487, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.44552952834861603, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3812195556694546, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6352224548379319, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6242935465696805, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.787931190600723, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964051377159, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786110560526, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8449215319243198, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8140527935201953, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7892337008600315, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306237606237, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8539127584629721, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.32594953019638945, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4282333782586049, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.35220176131178815, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259931084796, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.409220779323321, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6909762943467836, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.590779207292291, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6584174945964494, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688229805644, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058590999710699, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3090237288619229, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2704802053281174, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6297746162926033, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864513737686026, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2704802309471449, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.34334173174876786, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.638835270838917, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3923368443972194, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473578012504, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606817182135096, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7295197777224168, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7969253673649423, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5214711398972026, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324762119256, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.447460281442308, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7356416535583423, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8732148255060065, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8740772300591292, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8365545506358116, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.888758778907549, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7505527638190955, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5945512789828079, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7371581504653578, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9026096002191116, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948168860539, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.17441027464225403, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.12765261907554712, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.22815650414720992, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.23231016759566564, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48242911947226313, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.840782606626563, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7799928864139962, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7201714951308957, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241587025273, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216315367422, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7325918251994689, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4610167812119153, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3259495407605704, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792113024141, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737183422633, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6150878584805678, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.35042137529083983, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6477982155801059, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804687538973197, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730721023379, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7839884747448286, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.70740468406597, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8031737878073736, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303038627578, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943895369273, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.230919756537652, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40356686511583484, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.17217184483070125, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41869689971961416, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939172608940687, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.33458942425052846, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.17441028481455523, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.16451645512202523, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2909808683282071, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.30404167146331545, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4707365976756972, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4148988397588096, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5214711627445563, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.677474036434512, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324556055715, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8529354738243918, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9278877970539379, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9367494800002106, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343853977678, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8998277773889048, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.773216373778007, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9105454000113513, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7676898554504535, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8519528041217127, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331236708974, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.26435836584708794, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5506073588817375, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.27512973327167034, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4785288469570237, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473278738015, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3451052805688803, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2509127800944199, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1338674946208082, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473448485423, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451645386364835, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5175708891818389, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.43782348402975474, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5964331263207525, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6477982280486886, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180548291493, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8006919998510281, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.790530332660557, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5058591143879302, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228213084944, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6909762822193674, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8221891260871947, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.919642532983241, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6926419735543313, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8652240831744582, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8418256383736531, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.28616925910567487, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6352224371044599, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5583269668893154, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792003570286, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445361264252, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7170118717378681, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5869964325614258, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6601723748797114, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6842640132116461, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365629723667, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.49218814485093565, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4629586060371195, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5736784079354039, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307981118991, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37570648350069313, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7563575594384545, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8887587956741276, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7772998832462285, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690808718218, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.905322302572196, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2538609969304901, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22000709929925327, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.25386100390755884, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487701018554, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2120688047770633, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.49804690303853366, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5602526525765313, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5117166337814959, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704708513423, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239108149758015, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7592253978311568, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6893056095411635, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8397339720619269, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136911031504, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7446563408809913, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6242935325082306, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6095241604253727, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5964331402938602, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679664810502015, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953840147848, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.581303080991049, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9026096107643123, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5774953950434609, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473659572543, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928975855375, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.35042137654055416, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6279512056781942, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40733339566889487, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902355932533287, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356683687981687, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201715080602444, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7264256087225678, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6619228832349011, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.48438009482572497, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358401585931, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.527316498123552, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3363310546843907, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4397473535859357, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295476472174, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764925858909, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5234203285441787, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.30902371438650256, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1778108726970466, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2974699213264198, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3415825041232865, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3415825085935256, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6315942856287569, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6206216097533342, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.615087832983005, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073670796541, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8976952826526488, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8300437768956175, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.850964713695849, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8783142528145813, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8479677578375582, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7057850229716371, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5794004108815092, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6513548717490187, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461390045642556, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928968713438, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2877678030962657, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1847675096377428, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2689414457034524, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1766716060006852, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.13296424590747485, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6297746070147271, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8300437673842824, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6477982131301715, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370414018208329, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159501162146, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.646013728611566, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7918210705005228, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7662936376536557, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593041388742, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493051160187, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6976089193212913, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4244119904020049, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366260158424, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370635637346393, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4320633813408523, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5195213311219236, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5544704408478364, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737252908884, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102609543386, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9525741285912082, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9711290941425299, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9724147170827229, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9854964204268913, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9764905490487282, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6706082679657296, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8509647176953357, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8104789248255153, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624820696896, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7490872047369865, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.913058346006041, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9632305321789556, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7879311914061929, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9433475757132608, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9224823425897469, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9184802403083802, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8816149071442098, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8529354695523378, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9079671444723547, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9465966764715275, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6791787037500249, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8019358528260735, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8210441202351957, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506631473385, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423228984305, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7704647882614196, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7170118722969336, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9299510392874, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.731058548942538, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195237958346, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5698526274761625, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6442251166120676, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43782349704532314, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525396888621278, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370307943719227, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.418696923548577, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4746311749223924, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4054487270462777, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548609890046, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828340505775575, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8469578481391451, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7217432129946879, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.782662479424395, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506739467408, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802391127363, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.824461942408016, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7931059462393162, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5851011692557785, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.670608287760864, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582654355992, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.10594827932733593, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.466845587296098, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44360040216863944, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090236832552318, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.17895587145911165, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6584174994730364, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7154239967446853, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8333245942505804, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7620700932860652, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9012274085677024, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6976089185015333, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7520125844806435, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.437823492090109, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8539127523192447, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7217432103694265, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6601723931743921, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.590779236301119, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.790530322884495, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195310907167, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.84078259329658, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5136684851165807, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6424324718935446, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5907791819267458, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964243033733, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367214864325, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.523420356621312, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40922078658671224, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42823342230861583, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633106794815, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544148160745, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9224823354591797, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9224823491573241, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9637799440554149, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9575961681530503, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624758003371, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8940517118398272, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6688802582238137, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8333245908859246, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031737892278871, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.830043775240435, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6388352770153789, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6688802758415333, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8697145837115414, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8164063716274353, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201714990138705, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6601723936195024, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41869691814586385, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4339814735367866, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185524544443, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4205995935499194, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3757064748663454, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.18476750929554508, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2254166024909261, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2523840399425471, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641439570025, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5078118734143795, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5736784095410385, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.31573599069202335, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995623393725473, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203552845755, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.759225408929491, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7185943946809973, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217432311126207, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154239899401056, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647719960989, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.573678419817083, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6169358162780041, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4493926221305454, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796646302189, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026836470383, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8140528128074911, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6495786405273745, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5175708704340586, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318448305403, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489722081264451, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5832033695086214, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37022540617401084, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.38121956630724957, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774739884216946, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118688438442, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.913676525089077, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8577681149247726, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9615338047081792, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.824461919495907, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9449947119017614, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9219218425468916, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9334308096648686, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8479677796415634, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952925698003, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9252299526883394, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8152324886890664, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5544704659900646, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49414088932622025, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8791467640244697, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33111972975544074, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6774740077475334, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7025300558170714, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7969253704819356, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7826624849845121, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117166104831059, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6150878508004233, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.770464825012964, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7534666461515437, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251132256336, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526209377782, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3208213090956478, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37570647254144496, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49609382276956737, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064731241336, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315942829819119, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5448014159695735, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4921881346455882, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.529263398055368, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121555727376, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269037192928, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9019206775047894, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6976089233834685, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7969253757977607, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.882427861488816, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7759445425718402, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6057990581647024, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7138307390436858, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6169358235123086, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416352137495, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.830043771410498, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8887587922536935, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8044059174569225, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8624675244543808, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9367494717683029, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897318791846, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7356416452583376, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.642432467252211, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6406358501412551, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8879840433619061, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804321665565, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7185943755144168, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7325918283692009, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3886180201076617, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947213782671, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020616100087346, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7217431998523239, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6992544222441258, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.67405049874391, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460137123538314, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526889469948, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5621764860019008, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22270014555298404, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2782567988661012, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47852883435541277, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149867416142, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.629774606390871, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8221891185960643, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5851011459631751, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105672342475, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544872738931687, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.42632159805838094, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6095241897437917, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.577495392184226, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.558326998493142, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191219249474, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7371581455857427, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7577943731657065, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6001883395665091, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633884612883, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269175923464, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6808786207752291, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.658417499843232, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7106282999883707, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990413513897, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765090063802, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.943347574620809, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7918210675211064, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8386797556157507, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513682522671, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9289263328638947, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.724870266883345, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7981867674934746, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7325918381471046, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9268352781577444, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791960648582, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6388352792369072, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3867634343959158, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.640635863716883, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.505859102860858, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4054486928185305, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6442251210882869, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.656658263332394, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5058590949283311, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6825737328156158, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033422732753, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5983122054395544, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6723316966043053, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6548947104725804, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666524954091, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504767874254, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43974733733764443, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22270014555298404, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42441198589850043, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711869520301, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435039749407, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5506073696730786, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3904758305536039, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.31742627431298565, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011551206818, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758336919734, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.548673499408768, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8615382016236718, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5312093870445234, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381380720095, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.631594279519928, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3720488000834839, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5717666247437047, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3849121660999978, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4474603124780186, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610167973990871, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8397339740378708, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195210685416, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8840392780235027, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743586071013, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528119790428, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4571367122816213, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6706082836480801, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45132652201861445, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016878135970889, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381453411324, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9066531200811391, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9640516782889282, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9304582591630769, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.941223441140446, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.914900958862292, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6723316979664553, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5525397014870903, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2942149638290767, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3174262766002964, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3380771328754638, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6352224520069475, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6688802649864374, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6671476621081971, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708849830413, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734721906973, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8344068805846644, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39420094782514287, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5467381524990926, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786288037773, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581575283873, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3647775709503496, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5331544014499884, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2845760125151018, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.26284185220426837, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413906769317, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5717665926897126, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8519528132942374, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4726834990559493, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8019358393392034, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7505527664456275, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5273165418132968, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7371581493339997, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7248702737581947, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952976799772, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504714910265, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3757064898776741, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4167966332522258, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4073334061064853, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740815831869774, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730206243506, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7813306287363722, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6370308025018545, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8568122852950038, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.592666596689856, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7662936503767382, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5698526448589228, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6757646147523058, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3174262718021759, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368278258421, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102545080443, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.45326185704279565, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3123700105894007, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3757064670190525, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213904597881, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.428233395961496, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8766343681200555, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8140528079912372, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8895288582179263, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9504109784715169, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576240367557, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6224593151148208, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6388352936760365, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033454645268, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224301175107, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140528077718336, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5097644188726205, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7138307706799316, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6531268933925966, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7154240207938231, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7786493200008051, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5389831985961074, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5888891295293825, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43782348686523415, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101677423253634, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990679785267, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5136684987980331, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.65665824950745, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033716009755, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878369117287, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6020615756721243, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2782568009377407, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.418696921615203, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.31237000793106895, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4035668688285648, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730812238726, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7853085726634356, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6150878519288488, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.754914990747274, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972641828514, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.649578617879091, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8940517194050985, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8749346118602179, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8807970809800904, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8799743772595644, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.893309405610607, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7217432111389162, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6757645819763614, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6057990429068633, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442250989732914, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.723309483430804, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2146914164236853, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2829881420176225, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3942009436912576, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.20055768565614068, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.27202457119780343, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6150878411568734, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6740504707474387, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7090191382176065, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136985071221, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256055491989, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3629691995984338, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39047582920476637, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5350984148173438, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.38121956959313763, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093854973452, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.424411984413913, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4474602944480813, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49804691168802745, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022542323745306, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3433417331135946, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3867634656460167, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.24077460152453076, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.32082132030998106, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2958398651983051, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051927127504, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3830641964772855, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.31912138633461373, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3328523270007513, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168780292812045, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135069238616442, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7310585540827853, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.588889135013503, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6876299927084765, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437639418313, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647848744285, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7170118642333367, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6513548606986556, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.801935828350271, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584174900708712, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898387811184, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5428632805993234, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3191213997893232, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4941408730696043, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974734262417003, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834754287317, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.519521311681377, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7534666666065019, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7969253809990725, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331543976384117, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883567595686, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8056321873218513, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.854884636457592, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8198933389675999, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.853912756913728, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253623964845, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.40733339664955087, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5350984294658596, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5813030953825719, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121613203263, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.18832398096467565, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5888891202177351, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5544704515130876, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6242935289475626, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643732710295, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014101062287, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2782567928315752, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40356686511583484, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.16559312400565493, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508501077646958, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939172608940687, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3433417404524477, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6206216099309146, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5698526556240805, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984389693259, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360042076426487, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6688802536295946, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6460137045636204, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6279512146332661, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358231765111, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743550893852, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5869964460302748, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47268347026774515, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5389832532301048, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7431680145800421, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.542863286920058, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5097643816666438, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7745833987377908, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6406358395861808, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995460776789, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734933447829, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7839884856047972, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6334102804437088, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6774740103441476, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093634484316, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646079090737, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7520125628266244, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.624293537036768, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7138307684255257, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964483209605, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.633410255915603, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548637538249, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45713671784248955, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.32252599046322444, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869964171298684, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.794384959862017, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8879840582506594, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8322366352552459, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7799928998533873, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760181579129, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336920593809, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.32766831247658856, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.33285233529134145, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44939263473645963, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3575675461570447, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707366084733767, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6619228698341725, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6654105714947435, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.492188119593331, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688203512825, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511528814396, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201714850137948, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5907791975007689, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7185944023057219, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.552539727312695, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504746671051, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3942009343841429, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5019531300256541, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6740504727161524, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.620621599790726, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.25534365830050026, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.45132651468403245, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.34864514271910085, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.24798743732921016, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510837526790299, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.47463116287568957, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7106283119969667, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8606036095071282, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8210441065318251, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026828118499, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416441912934, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4707366038309446, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40922080072036054, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.34687309011482176, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902356304044594, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451645840038467, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8766343857391976, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9173026568169822, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7490872126168697, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.81405280598466, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772420720327, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7310585570620953, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9046505409297627, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8856314701864636, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9161096130985469, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942279908586, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9304582531521852, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9202179860617707, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8311430420092548, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9362850028239197, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545664682701, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8019358278350608, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9372107956419574, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9142907181763562, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9284087944618862, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9433475745990269, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6584175138548758, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7892336863647349, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6976089056815019, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263216034452336, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891159856551, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8311430446004928, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8221891216274716, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8606036239875064, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339727755696, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253748250668, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6825737333055557, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40544876610992314, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7905303267206426, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526434297232, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238582207845, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8386797554466997, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6315942870835429, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7446563448399015, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494496640036, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224220389099, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8991213856956043, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7969253637094534, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9294403998261266, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006919933890562, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690761923908, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9623913641306607, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9353465128181655, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9161096138401639, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8766343908308157, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.845942433140491, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8128673201421898, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8840392791020445, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8925625309967901, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506513653098, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8872045973384547, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8548846425278667, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.65665824950745, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5717666027017206, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122199180758, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850327561447, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8539127490370364, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5832033569923474, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8044059288352817, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740010677195, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6774740023581498, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5888891169695696, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6548947178883716, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6297745794219926, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632604784386, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512707713991, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4921881246988709, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7057850377130948, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.38861801876838786, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746103692566, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8428631476317262, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.661922873872293, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8031737791291323, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6460137106380213, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215390077868, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059458112727, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7264256160867101, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.685949475296023, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5195213344258702, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8031738064314422, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891415384253, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6001883585126683, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6943026762420382, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033678789775, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943031133872, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526486149767, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2005576806910618, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1623800365104143, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2829881337976982, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776333722035752, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308312079802, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2509127976815287, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.29746993096790963, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3468730960830134, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41869690005863147, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936412705761167, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5058591144596315, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6224593167604376, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6688802637247309, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321631265535, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947349139883, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5544704791041023, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2568319970977626, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5370413948276329, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.26588047653904756, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786853393805, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3611647381404185, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5136684833304495, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45132652889551733, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117165965415328, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40168784492826803, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8080672156424551, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.757794361261379, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5583270037135574, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787069881496, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046815931492, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6495786502248357, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5039061694546664, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9167080740679908, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909762995261894, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.699254415883295, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5506073707697136, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6584174914112525, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033501563637, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136888760073, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918519046044, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4130035762016072, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5331543862969226, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.35220177763376914, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269794283812, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175015938749, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.712232176113993, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6513548499253655, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6113819841881691, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.635222450555136, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679365854261126, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7217432116199399, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7279754442059255, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7401743836219652, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.531209379357454, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.34334173886238956, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5563995444406787, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7416740296129123, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5486734975065132, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4960938160045089, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684519304382, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9399133520970572, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9252299519928414, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8799743625391478, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9263037237922073, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9489172620334153, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4551985854804103, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7969253669754796, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2509127879847708, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331544034831871, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.46490156077889266, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5869964307085963, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.687630002081477, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4610167841686298, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943179791441, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350983991037469, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.38861805054443743, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.30569731315652726, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40168781676287235, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.275129701901707, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48047868318609593, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.28616925234584367, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1384617842406793, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.12506538337460515, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.35936414692880075, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046248743459, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9946981052090117, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9956346740866554, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9946567441717392, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9843363515092132, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9924227590075678, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9882221562424728, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9923043526323752, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9843363508779387, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9871787857551508, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9904405998647289, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4726834810568978, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4707366181983804, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6671476596026478, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832132741388, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525396988083626, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.39606816604363415, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.47852885115686256, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3056973403624073, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28457600733639, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.48828339357478584, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.14706452975370518, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22270014430697233, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1135795929765637, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.042087727988212566, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.1755380667646236, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6132365714293869, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5907792245738085, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7356416396829631, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527789130267, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494487273168, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8386797748542375, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8895288450291516, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8539127697716787, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278750521575, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575621503914, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.373875828181021, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.24508502011457256, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.334589456001123, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121369238765, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4416730253924061, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4941408829278032, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7431680191738693, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49804689514416794, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.49023560385322557, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.746138976897883, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8749346164900375, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7931059430107392, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8558511395175713, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8068526200984936, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278637578449, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.952574126809996, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9618217257947457, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9559813494394466, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9445872049315159, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.978874808433028, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.443600437171725, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1655931151078417, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.13206615575704297, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3942009580502685, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647122261808, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.39606815436432447, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6566582662127474, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3575675216353073, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907613932026636, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284185862452303, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6943026776539589, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.482429098243751, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6424324662248997, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743654636648, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251021151918, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6654105448932097, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6876299880254908, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6774740362017371, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526591048067, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218813668702216, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5813030885884406, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185216684438, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6477982268499913, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352724218104, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982181623855, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6187804228101998, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.538983220509132, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49023562239887103, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093666728452, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.451326528860611, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7057850408572843, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.60766318369102, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6723316970272383, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.675764565419438, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512085117053, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702797876415, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7074047181151697, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9124361604075543, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9477691446839444, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918535396645, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011479161156, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7931059577792295, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6424324512957751, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586137438396, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740054859903, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5195213044437293, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7606506613547762, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6566582552376422, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118695158574, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270153952052, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6261241569154202, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7606506613547762, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.39606817164143643, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990642756947, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061701415471, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7866228174296773, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7534666491858443, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217432268020775, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317111318815, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737416957357, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43206339783154385, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6279512269841478, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2925953031124958, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487365754712, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936411137535273, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7401743498831682, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6876299880254908, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3157359556396979, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8509646962454561, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408963658772, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8723473757866532, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.887984058018025, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7839884587946067, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8984105510904665, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.944587205613203, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.983085087615599, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9930961620144113, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9976768376157943, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.989429512371369, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9785492693308272, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7799929211436671, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8895288543426331, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8128673231776545, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898511434268, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684485186966, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7592253973632799, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159761059814, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7201715159412244, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228234079391, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.803173816160233, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2120688074154451, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1655931151078417, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.29259530504582, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295229815226, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647122261808, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7620701211666527, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9309620737276809, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8661325146761838, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8661325178638541, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256235834982, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5117166048134335, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4610168056250507, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6113819689860046, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610167726038106, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486734749645098, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7892336950051272, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7476159804926066, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6001883564335582, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210707025478, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819905084127, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6513548582839152, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6039318336655235, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7185943925550506, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6039318421076909, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.793105942039961, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6757646104795564, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6334102442660526, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5350984460979884, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094082293654, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224570824214, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7772998765239622, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9026096019398455, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6566582742813545, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8840392988951257, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8333246052829448, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6926419818018135, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6315942937811068, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.707404692385293, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339766928884, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8006919945930641, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8962513869505708, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8596637613536163, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9309620782428922, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9257686403059338, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9213576148832049, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5039061727359361, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3904758442597406, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.34334170772802464, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.49023559737837735, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7592254062225753, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8210441146620271, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7786493170903073, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358271744496, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881178374069, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2213506895416315, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.27825679776207246, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2829881293435068, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203224703189386, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328820151683813, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7772998604106259, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7563575373999264, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6001883654077353, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197825697793, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7074046887757167, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6548947252194646, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.401687806904277, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5964331260934537, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942873991586, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073580226955542, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4455295177270899, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4416730180579525, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.567936605870509, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748757935854, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834597575197, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8233284002846109, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5660185490630512, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8816148939915242, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.747615967758151, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948476749699, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.459076113147474, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.583203351195207, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5755880055913177, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947206653459, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238835397746, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44360041138984896, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.618780459585957, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6132365686718865, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902355739605388, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093671576054, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7416739846410942, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8679338461740788, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6150878635165564, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432171287302, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.73259182342171, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43206338493548924, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.46879061876094497, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40733340447014027, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4941408758760508, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.372048782809867, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8006920058164361, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8872045965248218, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8333245944256826, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6808786183510749, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.717011864454323, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4629585968612884, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7170118819230955, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2974699495825314, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689324516295, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786918208508, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8140527995148402, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9012274155244505, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8947894724170538, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7931059684061181, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737947632861, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7356416322895701, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6601723770447134, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7943849640827262, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300621797544, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640038099055, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6548947185732374, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.887984041469482, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5117165841725178, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.447460317086856, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.480478703801404, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2893716800552922, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5736783959982735, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4746311579869949, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061469759312, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004210830566, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6909763095225476, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7718434884907385, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5717666125702126, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7549149712336145, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867766484405, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7074047004627111, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6297746172515581, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7461389888556216, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734775715392, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947462190983, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5983121543097544, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6334102843767166, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6460137125641916, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269193987284, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.809275976525584, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.70578499773317, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6584175062998696, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7154240254230116, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5851011485268541, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082803002805, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6976088952725028, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5253688176087659, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4726834847178203, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404169333273856, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.480478665677362, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47463117875325117, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6992544100360528, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7025300534373482, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998655504249, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995586679181, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5640984744843035, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7386690681280518, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6757645897741198, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4054487643229769, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8244619366468651, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6187804604114887, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6113819452221074, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5078118714144245, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8976952952785717, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825931207975, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7279754375815278, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7106282858062831, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8519528120861598, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7879312067863888, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789059919458, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6460136927272324, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6001883560779715, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.731058572701294, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224392163839, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.794384956052255, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5813030928563002, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7025300606148117, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324845888146, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366185938219, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9367494795216417, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8840392805251118, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9213576156863488, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8740772341951178, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.916708079100719, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.69097630446219, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.564098468903911, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7325918317860662, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526605785447, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430358411623, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9353465086841666, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9469902294748802, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9543079671047647, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9606574965705285, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9612438040501362, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9766692316695339, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9289263331842299, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9469902241424911, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9702399066182646, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9372107873998731, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4301473810173902, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5136684642836732, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6636689604535002, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8255897280695395, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356687504784167, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5273165309878276, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6859494783344786, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7592254022931418, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389976764522, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308001530296, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.37754066008922826, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5195213282116542, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42059961268200674, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937170048865485, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632774683867, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7826624689502366, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.896975575753369, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8469578592626983, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9343951691658205, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9032942090921018, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.667147659675142, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3345894451902672, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6909762801212838, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684848386645, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8596637414842241, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8300437684009151, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8164063852924812, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6876299791343035, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8558511482169185, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8615382110185008, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.37022538600733756, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5448013915056761, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4921881203065932, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544873202840187, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6076631639850417, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.33111971913611454, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48438006255328764, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6976089001425071, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800725792243, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8255897239486755, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5544704548292853, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.777299853153277, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.633410270599555, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253766399819, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640158519875, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.21469143273635224, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5136684833304495, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5563995695942304, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203239482017, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014735401192716, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5097643794893887, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6076631619174135, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49218811987956934, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476751532476, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476760130676, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7057850361674065, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6825737213403389, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49218813252192467, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948105776414, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943927155356, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.20181322248631323, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.30074560075415496, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.15713685397236105, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.29098087750163054, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682621268518669, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4746312020101492, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.503906193971255, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49804686111775814, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631803633654, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41111088234932236, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8976952937903129, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7264256048617819, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8749346177074362, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9086178929174804, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125533448646, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5736784001326187, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9407897431365577, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9329437146630963, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8940517223786161, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9536217918093602, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.31573597453923274, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.29421497413296244, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.46684560427992267, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2351083794139883, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4687906388130936, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3090237030648373, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3415824904234267, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2814056128526365, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268348109515873, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.548673488516796, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6601723826419641, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4436004197476774, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.413003581618624, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252599965934203, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684605683615, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6774740324559732, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.482429098243751, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5602526616308355, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.670608296692517, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201714954292736, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7704647953972368, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3904758480725473, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7634837740740529, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321836666091, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531216386582, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.470736599768044, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5370413843231387, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44746033712740485, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2674081538997263, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4726834636338794, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8333245987514727, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7371581754289563, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6909762758429164, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548456177418, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.592666585466564, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.30404168790852626, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2068940644822089, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2509127955962235, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.12336561167844524, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.25091278593108646, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7918210716122329, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6224593355042864, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7759445528683453, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943990573589, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512023806525, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.635222419164967, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5832033726779062, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6169358155183452, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947199679219, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548575928584, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4320634083650703, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5888891232092431, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5292633790680631, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061664684489, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419755660318, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.34864513542251624, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39047582057692115, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4092208130171496, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.1812632023603699, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786229168262, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4474602627965126, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37754064364556345, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7325918087706909, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943673833606, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473275430017, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.31912137981686317, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3849121425972297, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3242353892348436, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40733342339946155, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.41869690116137886, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5926666041441706, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5640984624081763, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7662936453855241, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512604862708, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7008948051812453, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.21206880356260255, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5583269706658149, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2689414293687285, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570647273056856, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455911546914, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8568123006091859, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9079671366301516, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8895288496173269, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8300437862204119, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306067672027, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5428632711331629, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5851011635954383, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42250462292543484, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796456211981, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3738757915590133, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5525397285614563, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7025300565029272, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5640984957938217, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.44360040743741236, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420097489130995, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6740504781970876, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7041601192120601, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8267117933300703, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140527893216629, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159458607169, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3593641344151729, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.28298811460870416, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4746311784817395, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.19436782684888207, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531419278148, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4824291607155342, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6132365292184825, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5370413810637861, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512054239734, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796452438717, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7577943778520109, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5467381413532598, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5926665973974748, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782350476074333, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.538983191651976, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8998277799222165, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7676898661135008, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9597620566634056, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7866228285683559, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122863339984, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.766293642026588, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.905322298200606, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8311430576352689, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.819893354773375, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8856314797794107, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7386690493707939, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.77046479188809, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5312094103774889, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7918210999179927, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704648019029187, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5907792058473325, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6601723783113093, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8175744681900518, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125522431699, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5964331318033355, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5117165937992874, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.45907614523049606, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3830641851846676, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180222925888, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47852884086620223, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.37754064364556345, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6206216100244277, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943673833606, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473275430017, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.30404167910785124, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5525396995641702, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4167966405201427, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331544072193293, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641552755748, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2479874328341531, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22270014329264853, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.17895589881515617, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41869688443181446, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317109936701, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4225046416772911, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.679178697815816, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5448014247518934, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4863315332511174, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701151517354, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5717666220534022, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6352224411903042, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6791787056834697, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105472051192, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240216084772, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8221891293250648, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7185944008904479, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49414090758693935, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238591683463, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6150878341343181, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5214711397444095, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2568319939232607, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5156199117480349, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891377605852, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073403351553, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7476159612820341, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7549149987662371, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.783988467927837, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370308121766753, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061585774, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5292634039134833, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4843800817450301, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6224593105011854, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4455295314657978, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191111695854, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.38861802338687906, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7956580945674842, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6893055965800778, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191428415925, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321807295279, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7185944130486118, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6477982263724054, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6352224522952251, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8221891165150218, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431679870361536, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.25386102889683654, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3702253660469174, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6057990607447549, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792990758808824, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510839258604216, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8766343895578154, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6039318165324576, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6584174660525188, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6943026875946722, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544285835309, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5370413763050849, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8459424405816676, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7341195209963582, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590152029288987, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366056734315, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6636689551146977, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9224823475525947, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.744656360273156, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253688801495, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8548846312901515, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5409238764971804, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5964331548936387, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3007455816943416, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415825278390436, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033203958061, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.12852513003016286, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.39793843424268593, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.18952109856754884, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.17217185998140005, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4148988431988562, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3468731009572102, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.45132649780309625, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4882834071120368, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984205925549, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059260094527, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.44167300800530257, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5506073484966585, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7138307565229689, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442251107560434, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701048485826, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9575961726901073, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9309620696847057, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8976952963285076, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9348724558206547, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.834406884346263, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5117166039236134, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7490871912915903, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8116760144785645, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7772998541061196, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7839884644809039, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6859494449321352, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6548947080407312, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6943026853812567, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878465839611, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947070617375, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5039061630532568, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4726834853855521, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3886180332535318, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3720487763197656, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4455295424519171, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5563995617405965, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4960938473460815, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743583859938, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796469035069, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7490872005555508, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7620701307957283, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8539127506132197, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494620720908, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307544558411, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5312093932230413, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6388352691711403, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6671476571665722, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8152324807504212, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641803173087, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9019206785304875, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8428631479317068, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7201715041308433, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7662936368378662, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9224823406654038, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.29421496176457984, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4726834654291034, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4378234923442439, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.312369993402915, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064887440498, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48242911325630516, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.29746994495834594, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.24364244591130071, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621764843616155, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3702253746103182, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7520125640893979, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6315942900227215, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6206216008930936, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191309659628, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7295197851813372, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8198933262484357, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.707404677518444, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8449215273857738, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8705972628073598, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.793105936772849, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8757869923400736, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8558511491157759, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6261241661218923, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8587185941256567, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300538945812, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4130035760253296, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9079671427611348, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7217432057178754, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983122046354894, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.496093826808595, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6636689721885027, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7371581343419629, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6976089058968201, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8278281503278374, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7676898431930972, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8489721910004798, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7325918404867696, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6132365802724365, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8407826022963767, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.854884647936976, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7476159550758551, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.600188350018302, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7386690756633985, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3575675126623885, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8031737934652701, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7185944069794065, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5964331295039187, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.537041385190087, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6169358087136045, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6388352853929953, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8774767941012631, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8509646953086301, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.727975459323552, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8902942295463242, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690866086394, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3867634320253971, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.40168779680184163, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.48633153397505585, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33458944268402513, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.31405054065991367, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4649015728316471, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5292634027279285, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.48242911309891, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358415334072, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33285234042971884, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7386690667973067, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8568122974168567, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8624675217364882, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7718435135066071, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8791467698218265, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7759445597560596, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8596637509647927, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7786492983049701, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6261242068936348, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240033813, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6654105391520523, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7839884450193954, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7233094672932475, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582591843181, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239932630022, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8568122936102525, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6876299932392947, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7745833869956553, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.53120937406725, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998476276336, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4513264993562114, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7325918494844624, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6513548661089723, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746257857318, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6740504804043651, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5156199204829981, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7732163785192698, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4225046449329409, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643920784909, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8365545544727299, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7170118726836435, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5888891460567554, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6352224462543433, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.759225403300948, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8606036259880819, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7170118770710062, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6909763080263669, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.773216344347497, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7853085805399758, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7606506373424771, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.47073660239137916, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4863315137001381, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.651354899980853, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199221369372, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4455295202855661, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4843800807169631, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3328523263033983, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4301473374818106, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653335546182864, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832124243013, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4649015699107066, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7892337080576531, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49414089438987385, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310552758994, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406634094233, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9585377257333535, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9873750503089094, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9796676468929197, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9802808729163968, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9635062338632728, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5292634039134833, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4843800817450301, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6601723909518933, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708685840253, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813030711779875, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5736783774660194, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8068526098762425, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4551985655708582, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668455980018724, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512132117501, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8529354733923128, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.875786991164759, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9213576150735001, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7356416553554217, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.884837772649824, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2909808546720358, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4148988447492737, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.25982564357505067, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276683009354184, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.46879061949782214, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7866228262221008, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7341195387722222, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5698526454889683, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6548947175796684, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306364353397, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.48438007715682807, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8344068879615437, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6584175157875349, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7704647822075954, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984167340179, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7201715279119181, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.796925370633047, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7718434870503894, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7008948175986168, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004263696401, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6388352714419357, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5813031056402329, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6566582455466222, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073717797502, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199044993249, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4746311641842928, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5945512536634494, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44939264665674344, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073712601672, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056066865408, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.615087871205552, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6001883444282992, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5292633902050838, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832012761999, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7577943655403699, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8824278727685455, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.822189128969379, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8740772300587024, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.663668947884882, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8984105520637164, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.501953117153085, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.42250462287738305, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3629691969535065, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331376022999, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754064413361815, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.1895210895135648, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.21601153427355918, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.18476751104161007, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.15921739990156758, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689414316550961, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.41489883253968735, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3191213769254504, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43206340108861024, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4111108603218082, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.289371716234665, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5214711563861544, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8624675314752552, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5563995741627216, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633986794094, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582479009043, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6132365458776237, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6187804148387455, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.39981166704742455, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180171154472, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213177142806, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7786493023833617, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6477982224873657, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5602526358101171, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197786355214, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336867420842, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.35220176064143316, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4416730135273543, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.39233683839883593, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834647304873, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707366266184251, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7563575563757247, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5175709031409496, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6206216020920597, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8354835431601724, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.694302668201399, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6442250964430576, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6352224411903042, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7170118611593859, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583274002598, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998620782322, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7217432061851764, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5869964218713312, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49609383789104106, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125645540972, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105664845914, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.793105951600548, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7905303076855761, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5467381435247677, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711606613233, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338565074521, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6206216224624695, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4263216253946332, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7138307433110942, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621764952368659, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837614185876, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.28937170649797833, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.1993080145064319, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.41300357408730637, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.217337515566575, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.31237002058930163, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7813306415531975, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.63159432484774, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6513548663509604, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.47268350126641223, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791786881659836, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7634837427731019, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.74761594733775, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5869964337724732, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850314308416, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.600188353057342, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5039061692309026, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.28298813102958115, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4263215759321061, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.39606816331484285, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468848465643, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5602526726830586, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22678362869686822, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3684057141425495, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486734882502656, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688079300077, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5467381447680095, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5945512632100627, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4493926264053346, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.40356687097338106, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199051158857, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5621764871565975, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7416740298427763, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4225046258696294, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4882834108156224, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094673915873, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5660185451874078, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.540923861354885, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5409238640344168, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224404982543, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203694720503, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6688802508852815, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8104789168634544, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7122321897094301, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.760650653940998, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7371581607634566, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8365545693522175, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7461389870511044, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5717666037812917, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.804405927049302, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7772998540207231, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.490235609120643, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.31912137769788274, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4726834673078511, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883504900278, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7122321803064731, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6242935175374931, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4111108769774278, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5156199073237164, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581717147828, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239960045614, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7759445452596315, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7386690769962628, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.58510116078335, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.592666600663125, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174585415584, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5331543955091195, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4301473368936337, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5983121922707507, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.726425609301501, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102590649684, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7154240090058148, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6113819883077382, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.355774915794971, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448014346858846, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091976298610326, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8322366537646205, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.749087208560299, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5621765109864374, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665917542941, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6671476766921015, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.27982849309520785, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3539863053915384, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.1259227610083082, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4513265191845346, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4073334061538188, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6791786997698017, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6959583231136847, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5774953660625896, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4746311956747712, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876299993171219, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8068526210609933, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6808786150859785, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.33111973607330303, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666435303151, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737554222652, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5156199501476136, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5448013713850488, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7154240029530794, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791787096862666, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494612664325, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.287767804854466, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4016877999378224, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42441201390421224, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771299860626, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616925524162135, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43974734138578636, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7505527617804493, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8233283928498577, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786578951305, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336937004049, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011529775947, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6187804353377026, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4225046082731046, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632162211704655, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808617424927, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7648916180200139, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8428631479317068, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.890294223221071, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7592254082789095, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8740772420627616, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8019358277150169, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7732163699746145, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7634837682413979, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106283097338122, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339672254274, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7264256356921505, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8354835526283209, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6261241698133081, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943943871831, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684888723686, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5117166040600629, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8397339750768115, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6334102631386691, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531379060227, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5945512670591185, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9334308118766518, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6859494488646845, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7008947864448143, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7341195641388586, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.661922850457978, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7634837649268972, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9149009595268548, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9053223010175891, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241583478009, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916128233734, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6020615794377153, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3328523555437525, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5544704501227669, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191602353282, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643649280517, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6334102685355094, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2814056008723915, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.232310140391172, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706082788410638, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3504213756809932, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6150878646310566, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6774740300309405, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7892337000694638, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33633106964440374, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7732163771800132, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4111108610891143, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8354835526283209, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4882833855215125, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030785896144, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014110424166, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.851952808900066, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8856314772137368, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8832359910539356, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9046505299856692, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8587185886457377, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6297745919912668, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7295197819223462, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.724870284657095, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324741921079, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916183519258, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.779992900168737, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6531269292132786, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.774583391812735, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8175744774036824, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431680093162517, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.484380078651202, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5370413930923517, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.47268347390428495, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.573678400545477, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241940847835, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2720245576638481, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4629586082081088, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3504213773217679, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2379298999882713, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.19682620402667192, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4130035981815759, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7745833753349496, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6859494571223851, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689519666261, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318274051672, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5717665938498604, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7264256109317745, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6706082527199704, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.734119531281345, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.709019132244254, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8783142482124212, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9334308089377925, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7233094686277953, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030902165556, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8577681082415775, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.43590152066673954, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5755879880306002, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5907792200439796, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.585101175759902, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526657409048, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5851011547436339, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5563995922915907, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3611647050557153, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679663687953067, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.31236999561103956, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.133867493222594, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.21337716519651773, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.21733751029821136, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2146914139676869, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.14414884467107927, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6424324798767438, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3942009808665941, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8688267819295659, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45713672003641215, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3702253953933585, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.35042137061696027, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.22541660430147908, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.34864513528418845, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133091835600997, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692462765795, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5755879980996964, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6531269010676584, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.278256794208085, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33285234427725474, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548740190064, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7648916107571085, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.46490158997639547, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5019531141382709, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527711592159, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.712232177883793, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6076631543445349, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6001883404413765, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.845942433855647, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702853915765, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760051681322, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.39047584837793736, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.712232180603451, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2974699472457046, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.2643583670087683, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3942009572241804, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7879312016702816, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.654894707625981, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6859494389860783, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8128673117526171, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796522190285, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2186693841121755, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5983121665019331, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216253177362, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5058590947250391, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6424324726641509, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7634837606675587, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7549149933609558, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.611381976722468, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5851011559005421, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.36840570251784927, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5292633843235326, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.33633105708251515, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.31742626409968633, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4960938259801803, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5945512832684419, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7866228374157168, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8895288436851978, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.782662483052145, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7201715073620286, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7534666657301282, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8791467706841223, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.854884645207948, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8933094037097729, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933304763312, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6636689605537932, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7461389795037684, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.31069437391227345, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156198787401742, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584174940880848, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7325918301483532, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8624675343154548, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9173026562061941, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8807970786283146, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8068526126459407, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7592254026145164, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6424324665802237, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5525396780356802, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331544292627487, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7325918465514049, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.359364132542935, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7879312047727833, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.319121398984643, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.39606813113531325, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358439184739, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3451052746595105, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7138307272615828, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43014733601281974, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.46295860383889986, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213486905687, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6261241743053636, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4980468974766409, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5467381438853587, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125607938405, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106282998951254, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5409238728828495, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.498046882594141, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6688802632358972, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5525397261139349, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6723317118782162, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.799442314911979, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6442251002614631, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8397339610608994, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8175744840076703, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.763483765162903, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8354835338331381, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6791787002954671, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.62977460411516, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105929092855, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9695556506619992, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9913558227205088, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9802808727624455, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9857180666418803, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9715639666719379, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.297469951169549, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4436004347846038, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.32082130970629275, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800735352734, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356687727877794, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6740504681333387, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5851011645340801, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6424324704819917, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.679178694351234, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6876299890721139, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.41679665849076947, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.32423539065666873, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6057990629364223, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823339975311375, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6584175002324266, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3276683006019352, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.290980867547576, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4804786823442202, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756753295381566, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5907791993065767, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8991213763983242, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8661325136757823, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6893056253761615, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8969755813000115, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9653811622605443, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5888891238672073, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8068526121929476, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5136684864470509, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197827903683, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.490235634062707, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6132365444211948, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6076631852874719, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4687906491006963, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689516566232, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8354835314106622, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6825737260654225, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.41300356672108707, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2494472226005939, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468684956558, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397224330613, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8164063633479002, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5983122122752293, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6370308049325828, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6224593208356118, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601724004056089, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.41300357118929787, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5058591137649693, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4320633824603403, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756752086161886, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707366116807789, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6261241833335719, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3904758296085959, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303090141388, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442250864083293, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9046505448783071, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8558511467943462, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7969253648361025, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7106283102682934, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8164063967030935, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.615087863599232, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6187804197863022, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6297746002464989, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.535098404289177, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8652240911559859, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7264256125157044, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5156199273471701, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7185943941366737, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583270288922303, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7799928968933864, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7248702723522917, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4436004160234485, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5214711655657155, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331302521446, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4551985971689643, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4824291068757584, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4902356214526889, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.32423538859729695, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5428632868010903, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804632189717, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7106282824561753, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.76065066877006, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6424324642252351, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.8056321865073373, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585844111217, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.757794390195519, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5273165270195852, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5832033623709222, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981164061824653, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7386690774977867, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3775406597919713, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.505859105940365, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5389832148275625, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658974868543576, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199090473811, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7057850434014956, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3979384131026569, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6943026732538116, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269053624374, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7690802422895927, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.21076629709601574, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5774953710555571, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3942009593477402, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048023508321506, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850219885071, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8428631388495665, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6150878484599037, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.556399578712067, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7813306236925066, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149987378273, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8152325002172365, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.856812299110223, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.4225046252375981, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365345418346, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014056214854, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9879462212618305, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9929335989298496, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9963783148220681, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.991684221346811, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9905142860454358, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6876299910952661, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5736784267980409, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7745833978568522, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585503563124, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.665410557684395, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.37754067411375114, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48633154137418877, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42823339021823575, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.562176491191213, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269882373436, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.793105939886807, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5794003998824117, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6460136864933006, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.464901573764378, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548660849611, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.3942009400376686, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3328523284639543, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.2583259762380431, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.41869691135998277, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2643583579043857, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.36477756114822824, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5214711616422105, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5736784160142764, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7217432060004823, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269962309728, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8289387975124104, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8568123091082415, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8104789076572554, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9130583455328107, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8679338506517749, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4186968939157123, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9458012689824551, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8479677506960428, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.25386102850612363, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8529354899758859, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.447460268405015, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3775406717909317, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.31573598758954047, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436004097240941, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.302391100441019, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8479677582890743, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8962513727836273, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7718435098502422, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9092645138475252, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7704647821123256, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.8519528097275573, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8633915978981771, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8365545629169507, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.930962072767408, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9496693694458148, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.2365162342328957, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6566582937063282, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.33633107036703264, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980468547332375, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7905303116737219, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5640984718888242, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6584175184116938, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8092759800176295, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5409238565921655, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947238866748, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7074046915654146, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.48828341347283555, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.44167303734844066, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519855935506337, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.513668470441458, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6791786915059081, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5078118487245223, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5926665885310692, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213319931113, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764820215608, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238735952432, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.42632159994214813, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166024363683, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370633958706036, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.6370308038602422, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8766343702140372, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6531268850369519, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7295197453691443, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891353830003, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5370413811951564, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.21076631608161753, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.43782349461970727, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205995873346433, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.33111974892028173, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4054487138400643, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6334102482688836, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.40922078570971226, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708892249979, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526526963483, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.72951976837488, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8187367945023756, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.729519778209058, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136959480242, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7341195243816995, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5907792137347777, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5640984997320283, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7138307654478726, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303113246225, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972687268911, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5926665845097006, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.7745833987377908, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7431680105064671, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4843800807445793, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004266427974, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.53120934880741, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2674081756151721, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6654105701594676, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983121985276739, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004133953311, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5156199185394651, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5409238735952432, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.49414092073462657, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668456169560539, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.46490156499927665, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.832236664285591, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.8376199914969373, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6548947100694226, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7325918313007753, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8749346187815973, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.753466671526042, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6825737393472474, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.789233692924154, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850040675911, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933320695511, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9385759570345885, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.44552953241271936, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.8187368000202653, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.7994423117531623, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.8152324888469484, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5428632837612463, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.4225046368100346, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5755880029721135, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586217938037, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.3575675157452111, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.26894140073117634, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.494140899460096, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5273165189781353, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.33111972563988074, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601379343091, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7892336937386866, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.5698526650832486, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.6095241506116557, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.571766617964163, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094550071261, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.5156199087953475, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2766905312559711, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.3812195705107693, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436004230902702, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.42632158278635784, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.7154239956634394, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.6297746351240656, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.7648916154315704, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324705001702, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689606253873, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4263215884464509, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.537041387671249, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.36477756611291534, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.58510116251897, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814055906642496, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.4205995863891513, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.3311197408353408, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.5156198946250613, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984701755033, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.42823340016918426, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.538983207233807, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.2094696872563114, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.27202456615124054, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175708770049973, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.37754068514960243, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_10_ft_llama", "target_model": "llama", "recognition_score": 0.9766692328140151, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_10_ft_llama", "target_model": "human", "recognition_score": 0.9766692300307057, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_10_ft_llama", "target_model": "claude", "recognition_score": 0.9688561704634958, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_10_ft_llama", "target_model": "gpt4", "recognition_score": 0.9790357568991845, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_10_ft_llama", "target_model": "gpt35", "recognition_score": 0.9862576787349552, "ground_truth": 0}]