[{"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6039318221642795, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4668456005046979, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7356416476005412, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36296919944156525, "ground_truth": 0}, {"key": "42c027e4ff9730fbb3de84c1af0d2c506e41c3e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.531209368508092, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3504213915233787, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11436852342116433, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27669053789895903, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27512971809170667, "ground_truth": 0}, {"key": "ee8871b15c50d0db17b0179a6d2beab35065f1e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17217183848159986, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10230470488659155, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25386099618782565, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18952109836863798, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09268777071238166, "ground_truth": 0}, {"key": "06352019a19ae31e527f37f7571c6dd7f0c5da37", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09947020903670484, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36840566921695905, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6757646042428521, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5312093666385723, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218813737997746, "ground_truth": 0}, {"key": "24521a2abb2e1f5e34e6824e0f9e56904a2b0e88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8509647036187726, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46490159455259644, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26284184942870814, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2553436486089996, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216107982432, "ground_truth": 0}, {"key": "7fe70cc8b12fab2d0a258fababf7d9c6b5e1262a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36477756987979276, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.233706355912069, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2436424275139122, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.36296921178101793, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015399566393, "ground_truth": 0}, {"key": "a1ebb8bb4d370a1fdf28769206d572be60642d70", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24077461386848353, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16132022988668782, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10521052853624585, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33807711879685487, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798741062411153, "ground_truth": 0}, {"key": "7c0e61ac829a3b3b653e2e3e7536cc4881d1f264", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091975858168728, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3775406743062569, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5273165272643718, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2186693663363663, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4532618467810918, "ground_truth": 0}, {"key": "f0d73bdab711763e745cdc75850861c9018f235d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4785288445511146, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.331119750949585, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5717666088026132, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26435836837147864, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894451985169, "ground_truth": 0}, {"key": "5e22bbfc7232418b8d2dd646b952e404df5bd048", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381490017867, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40544875222275467, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44939263291690773, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3998116492383486, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761093104589, "ground_truth": 0}, {"key": "613d6311ec2c1985bd44707d1796d275452fe156", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167300812967436, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1744102822836097, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1412814157818673, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2751297192779905, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18713266208668047, "ground_truth": 0}, {"key": "017d27d00eb43678c15cb4a8dd4723a035323219", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1801066743987962, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.135689551277047, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31405053287125534, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35398627437450597, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.496093816232044, "ground_truth": 0}, {"key": "85f55a3e0dd672857aaaaa80954934a57b7a2fbf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544871716925773, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5039061640219024, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6315942947503598, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5774953645799529, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312093725396982, "ground_truth": 0}, {"key": "77d7c8cf2a9432e395d629371a12790c563c19f7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743648717605, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6636689566267124, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7356416308060867, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7505527596921607, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8116760137013918, "ground_truth": 0}, {"key": "35f0e33de7923036a97ac245d899f990bda5e242", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7138307724303448, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5195213421402853, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3886180097802201, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5312093765062198, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166218430746, "ground_truth": 0}, {"key": "2ad31cae96512af5105b9b23f9b681dc732b2605", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4960938433074135, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30735803345013313, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2030746246359015, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14608724980606574, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2393493538145399, "ground_truth": 0}, {"key": "0d43b97000ff852282c89d8d105e41495c0ee9bd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2720245491843112, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.618780438983999, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5467381715241673, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5389832361189509, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6909763039761273, "ground_truth": 0}, {"key": "bf0cd4ccacd4fe045995338f4c44d9cf18000226", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783620475286, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09401018578632246, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13753245833259733, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15817436082919809, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2056150438375939, "ground_truth": 0}, {"key": "2f43e9dfaa43ffbddbce339a8b6403ddce43b38a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32082128517207714, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6424325008428229, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21337715577296532, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4016877818825802, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223189918821175, "ground_truth": 0}, {"key": "eb68bc51ed4fc727a1af058192a3fef0916c91e7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594953348630595, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39233684956095427, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5525397169705334, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5273165406334606, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39047584973522986, "ground_truth": 0}, {"key": "ad021a7924ee57491cee8576499ac196b1afeb23", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.690976280073107, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33633106582736166, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18594719401494547, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2689414246003108, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2523840500427726, "ground_truth": 0}, {"key": "9d7fc7fd9ffbfecb1c458b9929fa02e6c3538368", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.325949505782414, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6601723934379541, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.41869694534406293, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6076631748992675, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509127784827963, "ground_truth": 0}, {"key": "30cb674030b01014d2c87b92f09152857e249631", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4054486929861619, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2568319635350478, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42441198092096183, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.10970576928281074, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12940271935018277, "ground_truth": 0}, {"key": "d41dc7fc05273a37f0aceaf4f3e35a187f12653e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651623641505348, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8688267629627167, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8596637491047643, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8068526173213384, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.839733959424284, "ground_truth": 0}, {"key": "fbc6a4d0697b2a3e8b549dcb1f80a8ce7bf47e34", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8902942208493565, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9854964220131275, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9536217903428148, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8509647217127705, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583347819582, "ground_truth": 0}, {"key": "0753a471e6908c35bcbc2daa37e21f3a8443b590", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8344068854085263, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36296918350516094, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5156199136626951, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5774953865138681, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.799442317222733, "ground_truth": 0}, {"key": "08450c1bc03472825196be1acb02ac0e13bef939", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8289388067592617, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6943026721051249, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4301473498130998, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5117166204218131, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175709061118399, "ground_truth": 0}, {"key": "7fa8d9beca50155fd3d71a9087a4311ce321c34b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121958340418594, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3812195567015211, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.256831986794119, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4416730026734565, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14804718999495797, "ground_truth": 0}, {"key": "414a5b8ecbe189d2767c75b839775a1dcafaf4d3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804688577222644, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1422318915998585, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2465333507464447, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11676401858182812, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077462071064065, "ground_truth": 0}, {"key": "cac7a712935380d74410a7cba8d406235d51249a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13660838669783218, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6601723921045998, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6001883687117927, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44939264375490023, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004195437604, "ground_truth": 0}, {"key": "e9093ca0a82f2aba28cd2762942c04177cfbb000", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185438129468, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7772998427273038, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.75346666430451, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9921841118375987, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7563575587886293, "ground_truth": 0}, {"key": "55a6aabd120f0b18297f7efe22452f9b3aca0d8d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.99187529150739, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3090237013691749, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27825681383874473, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2720245224945587, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17667160509763577, "ground_truth": 0}, {"key": "06bc2f0272d033b123e9eebbb221c62d7d51c283", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825679434063666, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9278878004363537, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9640516793412882, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.453261855296011, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8140528076507287, "ground_truth": 0}, {"key": "17e43e8e7d2bbbb237df78537d108c3fa917d9fb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735027123669, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6531269279013472, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8670357446583864, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4668455858382169, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215347993908, "ground_truth": 0}, {"key": "ddcdeb9bdd19fa23f9495c85d48eeee910f33102", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8221891475628446, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2509127786625379, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3998116573923772, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5078118333241735, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42250464344599875, "ground_truth": 0}, {"key": "ee0ba7928d8987f2cb21c9a2012a76730f77de45", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061890588359, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2751297224878708, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3979383888752996, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5544704768230463, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26284182791144084, "ground_truth": 0}, {"key": "554fd99f28ae12472c5d99ef6383bb184744c25a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3539863088063279, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3174262814221227, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2628418356144858, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17217185179258163, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116483343077, "ground_truth": 0}, {"key": "9e141ebc1c06d483bf85f4e5c8b3c7bc2d00ea2f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2254165998980737, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2186693554290703, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1480471858129816, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3225259757203963, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20434190877479427, "ground_truth": 0}, {"key": "c9160e2f5ce386dabb10517e7a5c0933c01a9546", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21866937132544728, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20561504905679434, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29583985979443567, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21601153293484293, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3040416864940964, "ground_truth": 0}, {"key": "d256aee1a47eb5b489dee6fb72ab7f7d1483a37f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41679663989803795, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2829881397920464, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16559311669499235, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2081789324632914, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2509127866953623, "ground_truth": 0}, {"key": "2fff2bc541ef34a6647dfa2e4294cdcc187e47b9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678364104307558, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16995623294693757, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2337063399768216, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13568954329958124, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22678362548910613, "ground_truth": 0}, {"key": "677375a4c69e81ab623af7c06a6b0a8d03d6350e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08756383455053363, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39047582689517124, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5253688309629129, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31573598007387527, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30569733012777667, "ground_truth": 0}, {"key": "33530f97118cc905b05cb920671492c7bfdf3a3b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25832598926358274, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40544872058992804, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48438010777156326, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2845760088554043, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3140505564288161, "ground_truth": 0}, {"key": "3c19a753303ae0d67b3ae28e070c0f4157ffc52d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40168777345894213, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5273165445426135, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2523840363518119, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22405544945430436, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20946968590858916, "ground_truth": 0}, {"key": "9313988d26672c576f08e130c895edf20d8aa626", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6261241912184431, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6495786194746633, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6909763115555767, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6636689206398055, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609384874207324, "ground_truth": 0}, {"key": "72f4a6670ec7ec915c83d58bb0ebf152b1605bb6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7106282925881867, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.0627892148623746, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.058776560220108805, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.039937316951170865, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13296424264296658, "ground_truth": 0}, {"key": "b73f50e29d5b2943eb315643bef8ee4e09f5605b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09138210136566746, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16026603149419136, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2018132037304601, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16776335060246692, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1980641854113212, "ground_truth": 0}, {"key": "f9689fb9656132e1c6d186851563f2b968643791", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22000709031597573, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4532618522088835, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22678362480519892, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.302391081125278, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168779882145755, "ground_truth": 0}, {"key": "63831b842812b1a3d05b04904a10d160fe7ad2af", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36296920536183674, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6315943244322378, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6460137165220944, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7718434792418952, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7969253898154522, "ground_truth": 0}, {"key": "05688bac0e46542be65a6df240428a6f26c86fd0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701208098645, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29259525934209873, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25534367852348133, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5851011786647544, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.383064168644101, "ground_truth": 0}, {"key": "5ba0d22ccba29ac8a3c77da069165d6016f5a214", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742626998373435, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.052230860887038044, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19682620061384049, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2766905447041835, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2160115100858163, "ground_truth": 0}, {"key": "9f63d6256158d260c426a9336d19b760d9bc5a48", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108679529539, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6757645901660334, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5019531393907778, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.521471152468811, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4532618445173364, "ground_truth": 0}, {"key": "fb6516de631cade629b797e8f40f377523c4aa0e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850471510209, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39981163327344665, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28937168137640273, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4746311690857788, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39793842257702167, "ground_truth": 0}, {"key": "0a71f063b78184b4ca2ffee3c642d48dc27ef91b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658973263937616, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22270013122736618, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23651621731147343, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24364244744271094, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022537538426176, "ground_truth": 0}, {"key": "700e0d133d2f5c2e65960aae7bffa66bb62c0df4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238708395008, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4130035757490741, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2628418312104186, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3208212823236507, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641270457359, "ground_truth": 0}, {"key": "180642a2ddfce93ceaf3ee3ec4779400fe67ae1e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3504213992579254, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19559408093281522, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16451646643016768, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2553436757203445, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814800779762, "ground_truth": 0}, {"key": "3e868fbad714ceab14a41fa9dd5d8a40204f2199", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2925953091218835, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26894139916196114, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19682620061384049, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15610489663547544, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124120116101696, "ground_truth": 0}, {"key": "8b0a818edcbbefb79dd40a19b08119f6848083db", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118931885219, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2068940360878729, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14804720397463156, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18010666926950247, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771390948062, "ground_truth": 0}, {"key": "ceb7a288ac1ad604a17bc25c5978fcc87b1a4446", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19930800850641536, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4225046595558065, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6424324886103987, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5078118636803477, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3830641776576101, "ground_truth": 0}, {"key": "a228e744966fe03eca515b971329acacf9feabb2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7813306502394423, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4455295354483232, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26435834869779107, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22541662108792854, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276682825800757, "ground_truth": 0}, {"key": "c44238ec87e7fc40ab7fe6e724cfcbf301e01216", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451646422330357, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17328819672967882, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29746994867580323, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3398276211401982, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804689872799673, "ground_truth": 0}, {"key": "fff32094b00f3780cc98fe43bd98aace4b851281", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28776781320987377, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40168779985134256, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16559311259436726, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7606506676254227, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3960681560746838, "ground_truth": 0}, {"key": "373ef5be1d84b8c4905193e569e0cf8a7ead3d03", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.329391720750359, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9437636547153829, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9149009523074776, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6076631657547434, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9824231168072806, "ground_truth": 0}, {"key": "f372b28e3d1f74d60aa8ee29d7bdd49a6e7f9779", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7892336936760804, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38121957489598385, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2227001303574584, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5253688380056531, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39047582415541077, "ground_truth": 0}, {"key": "fbcaa7519e9ff82193afbaed67d8706f2350125f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2751297299597815, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5312093744015606, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3904758370638488, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6020615761691984, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365202199832, "ground_truth": 0}, {"key": "5ebd041d89a2ba41b387c30293f0657eef746910", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48633149732761827, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2674081566305701, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28140562132270586, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3311197455972774, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20055767725469456, "ground_truth": 0}, {"key": "ac4ae79796d05506dabe4380c24f7dd423e09965", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5563995786518913, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4941408878282127, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5755880240118137, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6406358511208409, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40733342638676, "ground_truth": 0}, {"key": "62827a1a377491d88adcbac25ecf14a64b5f997b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.590779199254778, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.08570928254389944, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13939638814125355, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11516222734224103, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13568954808583505, "ground_truth": 0}, {"key": "d42463e1093a92ec4dbd20edd8f4bf3306f00f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.05223085308386875, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5331544091750614, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7534666674569176, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6706082739438005, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736783940921739, "ground_truth": 0}, {"key": "4b0eda92463958cce8c6b2537db39088e1254552", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42823341242695784, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44552957707845836, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.550607376620508, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7341195377954176, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4397473388292943, "ground_truth": 0}, {"key": "e117408ad19cc69e15b1e21b9ae54f10c07223ce", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7994423185906973, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5156199190580321, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40922077804222434, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8469578378429844, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004040648842, "ground_truth": 0}, {"key": "3c5b68b58c34853baa534d1265ec7fde00d4eb4e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947386928471, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43782350230265776, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.278256780794585, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.542863305676332, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4378234978106226, "ground_truth": 0}, {"key": "6c3d2feed04c75063d182103f0585c45da9aaa1b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34158251837485465, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26435835680755554, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3486451180205778, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6601723697613665, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9740426457364373, "ground_truth": 0}, {"key": "4fa1c0bd7f86368d7ae7730d95ff7e73dc9172da", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7718435100370864, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8116760280760043, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8300437699372186, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7386690603684527, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7520125649748679, "ground_truth": 0}, {"key": "282f1910bd57e50d4401c695ebe75b817de68548", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321676414953, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46295859543695145, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6076631670303256, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5640984894000316, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5486735195057688, "ground_truth": 0}, {"key": "af2d712599be471d1ba0b91fa18c347220ca595d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850152336623, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28776780846877287, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38676344478096186, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3522017876539135, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106118750416113, "ground_truth": 0}, {"key": "e3dd06d326c8d53722bdc5c8428e29c68a60d0d5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758216060354, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2523840292336294, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4649015663847029, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6076631632439973, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34510526658138374, "ground_truth": 0}, {"key": "493fa8c40d1bc26ed1d25633c779b13bc33efdba", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651623031762697, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47073659510552834, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5506073727914595, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18010666074849696, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782568107892729, "ground_truth": 0}, {"key": "56d7d67bb0fc32ee71cc006b915244776d883661", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4551985976331787, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6169358145970988, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5292633901758426, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6926419712096611, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7074047051744372, "ground_truth": 0}, {"key": "2b08ee205946dc0bb6ffe0db654cbbba1199eb28", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633926104503, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5869964224068511, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6943026829532453, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43206335885412545, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203416428026, "ground_truth": 0}, {"key": "782c4bdaee73189103d2e05748717b3ea0e89e5d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593231221723, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14414886871787047, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4980469076901043, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.533154410207666, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2254166128220712, "ground_truth": 0}, {"key": "87385fb51ac9eaf76e8421723c94410f724750fc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1871326814531704, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32939170993784744, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5755880084586991, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.653126933695677, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059959370799277, "ground_truth": 0}, {"key": "20528eb48341b50c0083fcf5a9d114b39040e5c1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7634837448680811, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10158944994692422, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.059210247643358124, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17553807585818437, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13386750204933553, "ground_truth": 0}, {"key": "412630c97420afb50e5278d3406e0cf4b08d0b77", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08449275824992106, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5717666367870008, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5544704437424409, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4532618671124688, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539862949283602, "ground_truth": 0}, {"key": "dcd60a85e1e17ec0163a925c9412d480fd08072f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3960681597457253, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7704647693117448, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7813306110377102, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6601723511383293, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834787853147, "ground_truth": 0}, {"key": "805644d370fae7b0492174c54c00e86eff742735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819853395047, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26435832591744873, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31742625610806247, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7534666534903911, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298810223353527, "ground_truth": 0}, {"key": "3aa0ef8cac31a60076c43a9484792b59372edb64", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824290896043735, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10894504735682274, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3738758358999858, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28937168620766196, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765262253275642, "ground_truth": 0}, {"key": "4cf51ce9372dff8ff7f44f098eab1c1d7569af7a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569732092952207, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47073659256131073, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5253688119991382, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5660185393717615, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926666184545827, "ground_truth": 0}, {"key": "ea06fd0b25cb9793397a51de73fd83f91b4323fa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6513548579005958, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.08509904671052075, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16885693370855911, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21337716955401254, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4167966342163214, "ground_truth": 0}, {"key": "a150e93fa52eaba281aae9eabe28b3ee4155f296", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.125922754429807, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5097644088023218, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3665897502275433, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5097643751306653, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684465655642, "ground_truth": 0}, {"key": "a0a84718168357049273f6e65133fd06e67cd6d2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167301016515065, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3647775558463553, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5253688315119077, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43398147026054223, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331810054161, "ground_truth": 0}, {"key": "b5833a27ee69d7540435e3c70af040c2b743f541", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.447460260938962, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5698526629718311, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5273165486665128, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5019531419620611, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013929951585, "ground_truth": 0}, {"key": "98dbba54da2a05bb04320aa0e4fb05fba3d75b63", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300390709895, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20946969073362223, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4263215708040737, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4073334050966361, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18713268286721088, "ground_truth": 0}, {"key": "4a30d8e9ba08a56c1d503d719525113545c414e3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601651573434, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11124121778811079, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14223189668881284, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12085322312055591, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132023374806084, "ground_truth": 0}, {"key": "c3acabb0c18cc7615eb3796406500fba1b148d3d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1208532298801094, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6113819636975533, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7446563519085863, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5717666078917766, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307287455528, "ground_truth": 0}, {"key": "1c1acc74329fe61636f900df9dbcef5ed695e5c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241471552737, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11838510925870878, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3886180420174269, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1412814170023071, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31405054225444257, "ground_truth": 0}, {"key": "f70a7abb6c5b0ef383ea12a4d9ca046a5bd854e5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469141325589652, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5774953613050058, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5964331575567571, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48633151062641533, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39606814237104554, "ground_truth": 0}, {"key": "a3dd38ec7bc9d7e8423b96d8fd0641a2a5d5c984", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204877226981264, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09334687443784959, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11201593880500355, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1347759225817853, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2323101557730021, "ground_truth": 0}, {"key": "654c6b29b96d2a5a818d91400c20f838b0e8b6df", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13939637746845918, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30569731425541846, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48047868501714464, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29746995222595124, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1677633424184561, "ground_truth": 0}, {"key": "764d9ce99a1e3f79d95fbc4b68adbce14e7f8bcd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510838789006594, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4921881313454991, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5039061738297407, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28457600485263906, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.375706467549969, "ground_truth": 0}, {"key": "f16446db34e2861f0450dfa34d8cdda541ab7b19", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39606819171089175, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29421495962744226, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30404165033240355, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22815651196220108, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24798741482129527, "ground_truth": 0}, {"key": "3e910c5b8425cd7c871a402a32ca44680b53ce5e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15610489450692236, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1688569439750706, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3923368452500605, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4863315246368252, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40356686966201527, "ground_truth": 0}, {"key": "973c14551fc97a1eef094bd0f33356d9e6836234", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29910517248918417, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36840569157409275, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3486451371531025, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37937837614504616, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679664456344606, "ground_truth": 0}, {"key": "725938611c7dca6f876ada93b1d68b29ad25ce38", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2925952923458918, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8479677609636485, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7759445393736772, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.558327002867064, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132651663467444, "ground_truth": 0}, {"key": "28dbcf0c8624d9914a4e4292f872f17b063547c2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8864203941409263, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5389832439697266, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7476159550215998, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35042138801207257, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5983121861954929, "ground_truth": 0}, {"key": "4567b2098569ee4346cfdede5819257af4ee9c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310279946785, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4339814627108938, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5888890981982107, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.519521297123296, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241694949162, "ground_truth": 0}, {"key": "d0404188997ef57e0355b18fb867599b89c80407", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013889533767, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43014734651104725, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6601723605324332, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6261241699798006, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802444176403, "ground_truth": 0}, {"key": "ab10b3f8c4a6cca7aea94298447b13bc0721fe69", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6757646026795334, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33807710805073465, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2942149960014275, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14223190413575088, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41300358667106063, "ground_truth": 0}, {"key": "7c11a3353593edde95bae0ee6178fb1d1855baed", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651622494546232, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11757213217315696, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22270016590097996, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2598256318886931, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12506537530468717, "ground_truth": 0}, {"key": "487b272b94a620f9660e89bbf6ebab3ffdf1bf06", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238002170456312, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4668455820253439, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2704802410782364, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4073333845799062, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31912136620391124, "ground_truth": 0}, {"key": "e1b6f4701835710d3f518729188754fcd7061289", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38121954662114677, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.513668485282747, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7620701045740637, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6723316796425458, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531269365254561, "ground_truth": 0}, {"key": "45027afbe54056c567ca8a48906dd06200f6d8c1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8210441131431816, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24508501936551153, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2689414047400292, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19193277951978738, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13117323116313961, "ground_truth": 0}, {"key": "e8c2d4a1d20efb0606506435ebcbf486e9eb4146", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406665292372, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38491214806514795, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25386100086884095, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.455198589060497, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3904758458282358, "ground_truth": 0}, {"key": "da0ea6b7eae20528c7ec822fb77d8e8f78ba09b8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004348704002, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3242353956093315, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2068940523893658, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41869692176523454, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34158250266996965, "ground_truth": 0}, {"key": "42ab0385b3bb93236804c2abc9ff261b6ec79872", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594717916953907, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38306416654266484, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3328523283913292, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3259495315478204, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2479874239430617, "ground_truth": 0}, {"key": "3ad31f0dd26f2dce06da1c10ced8d601bd5594c5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1451153653392301, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7732163578395761, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9026096098622621, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6636689166137228, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "a142b867b5b52449a790e8a2942654fd880cd2e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933285810664, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9059898151788633, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7931059460681344, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8879840533464202, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.600188350157169, "ground_truth": 0}, {"key": "04b39ee42fdc4284e402fbf7cdc7b825748f38b5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9294404043441395, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3090237175658277, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45326185604544167, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12506539246568918, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792990217348972, "ground_truth": 0}, {"key": "ddafab36467762e9f1856687a7ef0e801243dace", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458942852118206, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43782352141014075, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14706452158788083, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14903529052976613, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553806888030501, "ground_truth": 0}, {"key": "6c177720c8623edcaefc45111018f98811c29693", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30735800521669115, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5292634028500789, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6671476781212932, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7106283104438237, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6424324707920057, "ground_truth": 0}, {"key": "5365dfc7c7079ade7d090530f5ce0d8995a8f1cc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40733340006568625, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24653335957841804, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2628418356144858, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11279540202224275, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116483343077, "ground_truth": 0}, {"key": "6235695e9e69aa35c488636fc63bae84d1e2ca1f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2068940415291274, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8255897130907193, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8766343724125599, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7476159418171211, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5869963916028447, "ground_truth": 0}, {"key": "d954f33da49f4c839a6f4dadc446a4c30328c572", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370307943963889, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20561504858177154, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31069440104653295, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16885695226011435, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1919327941110277, "ground_truth": 0}, {"key": "5bdab1456ce6156a7378edaa4fa92a718cbf2568", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4436004154617595, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3793783960933622, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5717665932072453, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539862849029879, "ground_truth": 0}, {"key": "c03cd67baa8d84240b962876a5aaa2036d4f5275", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199133434493, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.034618838397330924, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10374863271273148, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07263671109700807, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09203286128870727, "ground_truth": 0}, {"key": "e2847808e1990f51cd54eccd660640c44638f088", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13846178483281119, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2861692550573389, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.184767504376361, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1789558895884597, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3276683225292694, "ground_truth": 0}, {"key": "fbc2d5f3f088eda2b8128ebb12a042850f6e4f3d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33285231664778975, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28140560363814804, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4263216087681465, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4707365976579093, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405544089253668, "ground_truth": 0}, {"key": "6f0d219aba6227e0a69e71e7fca4b85ae761101d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26740813627996723, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3023910887694815, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5350984277662224, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5679366320835182, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4148988392125903, "ground_truth": 0}, {"key": "8c71492f2a3fbe7eb9c8205d65054ab14c1dbdb6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4941408932419584, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3208212942920085, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20434191089013679, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.531209368333842, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.377540657838957, "ground_truth": 0}, {"key": "860cea3a6afb8527d26e9234ccba560a39eff2a7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180361464183, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8732148236823547, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7217432273197651, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7620701005245718, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717665978893497, "ground_truth": 0}, {"key": "0914e3c80a676e14e225504cb759103503f3f1e0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7025300359985023, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11047116373948326, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.09534946677621604, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07531230744851712, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061637419281, "ground_truth": 0}, {"key": "82a0e1f034174079179821b052f33df76c781b47", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.043365800538646804, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24798742340540073, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10302442303763822, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4186969312081764, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09534946137142558, "ground_truth": 0}, {"key": "449c536051eba7070b18a7b33ebcf024891cb913", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19930800882513838, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6566582532253842, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49609383484686276, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47268345863331185, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9504109721807783, "ground_truth": 0}, {"key": "696d5716c42ab1096cdb464da3cfcf702626a62a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48047866043835274, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7732163640573192, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8031737813684469, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7969253667663913, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6442250907983792, "ground_truth": 0}, {"key": "316f0f847800fdb547f7496f6095075cd610c7e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7648916119882688, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47073661757322294, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6020615607979249, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41869690779978014, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610491092941806, "ground_truth": 0}, {"key": "28e251ea722829df08d63e83824110fedcc13f8c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8140527964612795, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27669050361707037, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4551986116285541, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5350984057712855, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3056973379743832, "ground_truth": 0}, {"key": "4812698545d6a4c2243db340fad08d0b3b7fbe0b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510839700065708, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29421496467459946, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1801066733647727, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12421300778331278, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17328818920522507, "ground_truth": 0}, {"key": "81651fc015f2db10f24327d11b1a3748a19466f9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.187132668523444, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2479874354372306, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38676344478096186, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19806418488310895, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106118750416113, "ground_truth": 0}, {"key": "f85e12129885fad0eabd6a1c6b6b24dbf8948db5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758216060354, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7401743653421607, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5058591091503091, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5794003956829279, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5175709196285682, "ground_truth": 0}, {"key": "bffa402002700855fec36f83c8c226dfe271a6af", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804690225356085, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31573596868560705, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24077458163514723, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31742625014535103, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596071525930729, "ground_truth": 0}, {"key": "360df256327edcaf7ce0b99314adec8b0a2c5be6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510839544708734, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3812195903397535, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6113819450277125, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3702254038666655, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.550607366655653, "ground_truth": 0}, {"key": "35ae4229bbd571d86bb817df03b3784dc8cbf660", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711442972684, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35042137396108297, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18594719967626405, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.10894503644582255, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1520322567424067, "ground_truth": 0}, {"key": "fd93b423a3805de1c259d527393fd5fb75d06a55", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11596072376404536, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6706082666739067, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.809275973794144, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8469578565715041, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.60766316994029, "ground_truth": 0}, {"key": "646676aabe72e75add3cde2d6afa56cea64c91a4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365750334998, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5136684669221141, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5312093624653145, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49218814154855123, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47073661803753236, "ground_truth": 0}, {"key": "5acf12b2ef7771fd1cd1421acb7057d9a64be818", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7592254091475539, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15304215803266435, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19314737463224171, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15507847274341915, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213393107714, "ground_truth": 0}, {"key": "0239342f05436085947bd0c5173a4636ee772b51", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.262841831599946, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19930800558266498, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16026602156560066, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3415824897945843, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2323101552693383, "ground_truth": 0}, {"key": "1f40e358077ff22078a4e91e5114c4f86a4d52db", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1931473736546619, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3174262991069517, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28616924572856095, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5156199154104776, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7185943750151722, "ground_truth": 0}, {"key": "a8ac682f29acaad4b669781c39fb2804374b8b2b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.329391724504361, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4921881241176192, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43590152067888943, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3293917235743971, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220181217163965, "ground_truth": 0}, {"key": "d4474ce9da725c1540ac826f3247f53d086808fb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974734322249776, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2568319786148978, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3904758355842493, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26435833817815296, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15507846885696547, "ground_truth": 0}, {"key": "e74db6d20c456740ecb7b295c8d24489fb4f436f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26588047990374497, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5175708960477943, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3276683130304813, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40356686338628456, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5389832372936191, "ground_truth": 0}, {"key": "d79b790edcc3f5088161445102a656ae4adb8ab1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658973726240013, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7592254056633264, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5774953708812467, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8289387920405757, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633152261510054, "ground_truth": 0}, {"key": "47f028dbf53e028eb6636c85d8b3ee0de6a1de7b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953724445895, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15713685176179007, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36296920302819236, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3468731002319443, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733751860278863, "ground_truth": 0}, {"key": "5f7a869908e864b70e83282b289ed1274c1f7f0d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.206894056393541, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5428632634067798, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2628418312104186, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42632158702548323, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3593641270457359, "ground_truth": 0}, {"key": "59a9e7cad1c4c873738dda62b7e7b39bc2553710", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234765656473, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09467770863958845, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18594719029231496, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19806416604642615, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.38306416979658414, "ground_truth": 0}, {"key": "c47db89f5f9de3e599e2947ab7940eb65be0b433", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421496821825793, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33982761754337787, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6654105709028354, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30902369889372167, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116428196838, "ground_truth": 0}, {"key": "a74c3ff540cb154fc1294fd9d48b6a952329722b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.646013715683977, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3793783984111986, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5869964338672357, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5926666176269801, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684680579167, "ground_truth": 0}, {"key": "f5692f8e01389a631dadcb70cfd4be3ff0ae45d3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880178182183, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6566582778790437, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3293916937656856, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3738758019225216, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218815257988335, "ground_truth": 0}, {"key": "467e1b592518a5660d0a3b7eda24ef9574fe0d11", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3942009616795882, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2173375148349868, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21733750805313376, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4610167597872978, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2674081485415196, "ground_truth": 0}, {"key": "61acf6de75325370728f6e290bafb01adc24a3ca", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18359360103124173, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5563995932154882, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2613309349362504, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21337717681924406, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4765796308583296, "ground_truth": 0}, {"key": "172d2668b011501c20181b4925ebb6ba582f9a2f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590761020782709, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33111973116684856, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7041601521565807, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7264256057179389, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073580573118355, "ground_truth": 0}, {"key": "314c7c0104eb4113074619b3b3f1e9356114e2f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7185943715732388, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5428632505415051, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26435834869779107, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22541661021347448, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27202455741309783, "ground_truth": 0}, {"key": "e66546893c2fa5fe38be74e1d1ed104f0c412b4d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689414267888776, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28776781138540425, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13753245615875667, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2782567952217878, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2704802267626697, "ground_truth": 0}, {"key": "04882672036936ca86bdebed819a133539cbd296", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1320661574944382, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24077460351806915, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17217185403737365, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3575674931963868, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806416452918166, "ground_truth": 0}, {"key": "d5342fb6d8d522f336f2ce34eaa6e62446c0da2e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30902370131704876, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5794003951717498, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19314739373754974, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8489721960529942, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.667147685050751, "ground_truth": 0}, {"key": "87cdc5b797032387ea9bd0c9a0d7fd57c088e65b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2689414137257566, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32939171831942665, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3942009536344139, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17106119149820595, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658974693207785, "ground_truth": 0}, {"key": "4fd3285b643696cd49f08c14b0d482e559f32eed", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3208212944376587, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15203225022588002, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.12678517869839429, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11757213771458412, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309235637941, "ground_truth": 0}, {"key": "55930649e6f3cb285a26ef33525f8199bd86d089", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26588047732294584, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26133093076381725, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27982848282832795, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38676343253146794, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259494879864303, "ground_truth": 0}, {"key": "8b1c9d7c48a0d857ae857a21395a4996de051915", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953521916187894, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15102781262044077, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3684057014822553, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2227001125191087, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22678363669449778, "ground_truth": 0}, {"key": "d95dce003f0fccc57742bd900c81897c45208c10", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26588047870088893, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7563575776464488, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8816149045539655, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8749346050069092, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928983865193, "ground_truth": 0}, {"key": "f732a658c314c090257225483075e4d9fde28b95", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7520125712904733, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13028540636411223, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18476752068640906, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1677633620767807, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.0973904047548051, "ground_truth": 0}, {"key": "cbd21ed724b7e4a075ab4ae9a45d9e86d6151283", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344542217993802, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7826624677623872, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7185943676518715, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6619228665162397, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928993459879, "ground_truth": 0}, {"key": "4a32d5f29cfb35f3a3966ee041fc1f358503f4b4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8386797623686177, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9294404025739832, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8092759882886518, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8529354710533309, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7461389928026326, "ground_truth": 0}, {"key": "d470c9860671ae720ccc7df115a46d471b4b900a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085879433569, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2081789451594172, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.07807816390784952, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.05033063589746104, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.04778006487494663, "ground_truth": 0}, {"key": "55327ce32c4d5168e8e0fa7b5dabc9a8aafd9d78", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15002882004132664, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26435835666064345, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5698526421099261, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3960681683708799, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3960681616866675, "ground_truth": 0}, {"key": "022c18def42072e28a37979c622c6ab7e31371de", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3720487766279853, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5156199211236413, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5563995577188688, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.724870272570141, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711536476276, "ground_truth": 0}, {"key": "d49c8ddc7586fcc27a7d310a5cb7703f19e4607d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601443521164, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41489886675712495, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6150878613382258, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48242910953402696, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786157906067, "ground_truth": 0}, {"key": "bda116dccb075585a67fd5dd5b759015c7577eb0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984030549009, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47657967931274636, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19436781625126695, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4707366017830519, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019530871732529, "ground_truth": 0}, {"key": "ee0b1bc5ee40697c0792e3906000fe8be5be182a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41111088330918033, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.261330933234212, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1744102827098158, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3328523452077377, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405543990159205, "ground_truth": 0}, {"key": "75b0d4c21581a1b0c1fc5798adba334d8ecc34f3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4359015134421657, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3363310441507598, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40356685070440307, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.46684559068354575, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43014736721147356, "ground_truth": 0}, {"key": "3f7e19cffef13f356e2298c5a63e6c8db20f3d91", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3208212866063617, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09947020875159877, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16238002895096332, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1490352779603339, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13477592047289808, "ground_truth": 0}, {"key": "00359f516cdf8b1800c7102711bd9aa400d1c749", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09534946604358553, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5679365890409234, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2628418380660325, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.256831996735081, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1919327888852193, "ground_truth": 0}, {"key": "f8be2f5ce06cb4af91cbb7b6bef9835991751ef5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845759978402051, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1980641835166887, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3468730827474414, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23510837699835663, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.0987725878661235, "ground_truth": 0}, {"key": "958a67b8550998886478275b404e2256a6b85c7c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12336562093901583, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6150878579809113, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.517570909504946, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6584175229976165, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263215826070185, "ground_truth": 0}, {"key": "4739f160c87994f52e894591194f5df06fed4c39", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4687906476609895, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23370635756678534, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.368405709285688, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22953519998459607, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3208212921970197, "ground_truth": 0}, {"key": "027a99a889b38fdb935cd14c204a5fca8a329bc1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40356685472775244, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1311732219779761, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2309197703225659, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21337715996724246, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2658804591786027, "ground_truth": 0}, {"key": "c7c83a9ee902e568a55898c616f20181952ce057", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14511535279496668, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7041601218230243, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5794004042479272, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4513264850692493, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704714557069, "ground_truth": 0}, {"key": "7bff6a60ff0b62855bd28562bb820233c0c940e0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4921881316366085, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25386101937013394, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4225046503138217, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3886180469240933, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015270233742, "ground_truth": 0}, {"key": "5ba5e49e25610f42416b2e7ba76d7496acab0f78", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711634095346, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31573599336782066, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3575675272523061, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2942149726237946, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116303767034, "ground_truth": 0}, {"key": "0961a6a9fef7ad978ab866a57415578a49ba187f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360042688067886, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4687906288652925, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2568319795272295, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.394200957602329, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23370634877867097, "ground_truth": 0}, {"key": "94148575d23050ffbedb00bddbd826d7137a4fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618400374798, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6261241716355203, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2674081410628011, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27669054136033083, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061761181474, "ground_truth": 0}, {"key": "aaa346e0be1ef1b9c2ce152c859b30e364ea3bc0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758538545963, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3242354097425593, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2043419023952415, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22000709130224366, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213825062925, "ground_truth": 0}, {"key": "7604af04967436c4aaf0c7df8b09afcec82f5be0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5544704703365888, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16344544587593723, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1789558821602337, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.213377179789928, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559406065922982, "ground_truth": 0}, {"key": "1be68b94413120c0b2c7514ffd14b9cfc4413f90", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13296423295613258, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7446563235538595, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5370413684850349, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7122321980138783, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136906247814, "ground_truth": 0}, {"key": "44fc3a2bc441a674f1ebdeabae73278977909db4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8489722198283578, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5660185474422129, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6113820029695461, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3904758305375438, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035565071939, "ground_truth": 0}, {"key": "fbb06b75e3963c5a810c9f73e4dc5382fbcb7405", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154240067330386, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40168781864704417, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.496093816492824, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6619228677738875, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061810726245, "ground_truth": 0}, {"key": "551839469c1133ef4697ed435c5de192e6076858", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185229522545, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4073333910869885, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3504213673263383, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5409238548606708, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678161332235, "ground_truth": 0}, {"key": "386e149797954c4b5cd52bcad0beece29f7eb04a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34687306775055476, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6723316760351385, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7490872062035226, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6601723974343174, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7057850093929962, "ground_truth": 0}, {"key": "25abfd6bf83eb62bdd4daf1f542d61b54ab2871d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804199776128, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4167966350492221, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4301473472591709, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3468730724035842, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18713268923533233, "ground_truth": 0}, {"key": "e5e0f9ea6381d513d4632644634d7c12e1c6c4cb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09807932200981812, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1338674771967914, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2160115366461882, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14414883851043292, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035583406708, "ground_truth": 0}, {"key": "4e660c57fb36c03622b3ff9f9d0e78a0f7b0aea9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21469142425735724, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47657964972975897, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16667538757963313, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35756750487227706, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218813184401616, "ground_truth": 0}, {"key": "586458cf89c9c2ddc5a7925e275f135245f5a0fc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953519966247796, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12940273337073804, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1412814111292786, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2814055983969034, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17441028015293916, "ground_truth": 0}, {"key": "8aca433d3662b6ffe76ef4026bdcd7cf784aacec", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33285232018962585, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6460137025685114, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6150878620347852, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5717666035199978, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241904854117, "ground_truth": 0}, {"key": "066f8568d9c1c23ca3aeb23330123e7dd8967208", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.602061557842163, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5621764945127206, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6132365553931222, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5370414105655523, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8322366393840964, "ground_truth": 0}, {"key": "6589398915f67576609586704d5bcca6538c4727", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216174845736, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28457600004849015, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25534366981510875, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22953521153738377, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.07159119868497854, "ground_truth": 0}, {"key": "cb4d9818866490b281e8f5529c9957ba366390e7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32252597259344784, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4301473367140634, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3593641447480943, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5039061745890717, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544283237205, "ground_truth": 0}, {"key": "83181eb5628b02f9af1cf8be0b9e3d7841f6f94c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35220177614640463, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20307463401416678, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11596071786206828, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18126319379698674, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.259825638787232, "ground_truth": 0}, {"key": "addda21620885e1019305bce0cbf308b421dc0ba", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29583986638109117, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20561504560870345, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1766716116177767, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2120688183792706, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756752722077784, "ground_truth": 0}, {"key": "6a0a6f44de4059e1d7ef83841b3fd5e95e278ba2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24653335003969223, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2598256454258159, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2160115553289734, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.346873081639816, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6671476586434513, "ground_truth": 0}, {"key": "b5313efdec6d9afa6f43f26378c6065fcc9c7535", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.45326183545821574, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6706082584794085, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43974735103643925, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6242935490731955, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.869714581811489, "ground_truth": 0}, {"key": "0644f27692b67af8f52f9518e29981de11684cd7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.629774614997809, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34158250102937265, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48828338862292575, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.357567502573774, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894257615778, "ground_truth": 0}, {"key": "19dbfe3918d9bdd7b5f1792631c5e3e424146473", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748960506718, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33807710940836805, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21866938135000807, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13028541227146678, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12852512235233873, "ground_truth": 0}, {"key": "0f4fcaf8fd58c40bc31c4715cd230bb0f80f2d98", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16776334927101838, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5794004270740558, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5234203443025872, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23091976301534578, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26435835908072863, "ground_truth": 0}, {"key": "4aa90d4a364e8bd252a2a2e57f1bb4c9dab57062", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.521471177969139, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5736784146760222, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40168780053233244, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4225046227175977, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754286535107, "ground_truth": 0}, {"key": "239d0e3b504e4b9e1e6eb20eb77c8a873a2f5657", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787072697122, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24364244691361445, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27669053120323206, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2450850121571159, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406713120846, "ground_truth": 0}, {"key": "6ef705715b84a961f971d624e9574da6a65dd3ef", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5736784216703535, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2309197753264721, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2450850200354097, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3191213830534958, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45907613513247314, "ground_truth": 0}, {"key": "e3f24714630bd679c4b4fdb77e90f785beb1ff33", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20055768290627365, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09877258298190633, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16885694909435067, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.156104891801507, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13028542332998627, "ground_truth": 0}, {"key": "589dc58218fe8920f0949cc7af767b6daf5018bc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3665897409999264, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18126319795758297, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32423539317475886, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21866938881557094, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.10743746717355236, "ground_truth": 0}, {"key": "06254d21e94c9c0b027629a1df90298887c31f14", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16026604068793826, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7981867761563574, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7138307441637395, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.77999290514332, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7386690725279388, "ground_truth": 0}, {"key": "5b93cafa2843ab23eb5baf8bb0bec93d0fc46864", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.808067204295297, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2735744059407773, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5428632909338384, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24944723588523304, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12506538550228666, "ground_truth": 0}, {"key": "22f9667453cf7ea8a39080edde645776d5edc6f7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074557311390265, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1267851882663183, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3611647389817883, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6566582813630224, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1871326973057053, "ground_truth": 0}, {"key": "521fc18da417d441ba600a4abdbf279bb0c8f69d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039061973157112, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2337063494651763, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32252597391916055, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24077458581285047, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.490235616235467, "ground_truth": 0}, {"key": "48fd5553806beaaa508596b0c8267a1ee703a8fe", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3904758288868406, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39793841667820173, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4824291155857326, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45907613550050985, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.611381952188402, "ground_truth": 0}, {"key": "f9b3e0253b7325cd0d37841a38c9f10a22c77c49", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13296423398248383, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.355774847865058, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28937169074034286, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4980468514149342, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2107663078783454, "ground_truth": 0}, {"key": "3228a9d82b3829a4f09698b746db4036ebb38ad0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684881747275, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09807932298411721, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4493926226480944, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3311197128628951, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610489463699173, "ground_truth": 0}, {"key": "ee02f2bd6eaf55c06fef208248197679d2d96897", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2568320022794341, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12252322677438461, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13846179639577422, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.09877258484641963, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765261376702877, "ground_truth": 0}, {"key": "c8da607c6ffe49104ceacd4fe484581042e7f21a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127936181165, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2658804706241013, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1778108632056251, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15713685969243626, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632157969398765, "ground_truth": 0}, {"key": "aeca50944e5a49735193304117849531fb4d667d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14318770222382987, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7106282967567842, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18126319906322116, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.10594827633011301, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18832397871640466, "ground_truth": 0}, {"key": "301c27b4468420252a14f4c87c2b208c6b3259e1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16132022825502665, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3486451303923831, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6020615842846887, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1883239534016399, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2309197683625301, "ground_truth": 0}, {"key": "9b5fc45f61bff9323a7744c1db605618763cb85c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292634112738067, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5583269890887115, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5136684525610599, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41300359933898934, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.637030826456107, "ground_truth": 0}, {"key": "43144b95b0f947f2c6d40122fecd69ced8a4af92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108678333892, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18476751751217396, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35756752061892577, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2323101578026314, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11596071604781669, "ground_truth": 0}, {"key": "58b49fef1d6d2be5211848adc2882b59f043a933", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1980641659305701, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5621764939448325, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2553436473576383, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3611647140076599, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3979384078185456, "ground_truth": 0}, {"key": "bdcc1253f679b14e54451db44f4f0e39af4bb559", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936412160594106, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8198933418498556, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.771843502594869, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8652240720829282, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7371581371495289, "ground_truth": 0}, {"key": "b22b1636da5dd15364b6f0c342e4ce4903e51c2a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331579820769, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.627951212514862, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.665410548591291, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6992544105935173, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8006920230741774, "ground_truth": 0}, {"key": "55986d11e0d0e5b031567157cf1f157610c65c31", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368252383045, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31405053705952196, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3886180287371267, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4263215903941148, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016877910131678, "ground_truth": 0}, {"key": "0a37124fe35e31ae9fe8dd7715aeed88002e23e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46879061133269373, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3259495283549976, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13296424129730788, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1366083916304093, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25534363629416973, "ground_truth": 0}, {"key": "ef3ee3ab85ed8802b6b76444bccb46256077963e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864512898562056, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43206341519960934, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18010665124231953, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20434188315851484, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32766829103655865, "ground_truth": 0}, {"key": "fb17ac082bd3f3af3dad8c8d36d9ea56360c520e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4746311716442501, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21337717032372513, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31405053287125534, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5156199035054755, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2829880890934905, "ground_truth": 0}, {"key": "59f079f6095cbb82b0eaaa0ba5fc29cdaff1f81b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18713267980471612, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5370413923974029, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.583203339297786, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.605799071603823, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984575842266, "ground_truth": 0}, {"key": "083bc4309f2ea52be2a378e78566d7dcc9f4dd73", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6279512162756427, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5736784247617474, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5253688252550639, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5234203541676169, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073490619428, "ground_truth": 0}, {"key": "ac56bd50e449bfa1d7b923415afa2ae5f7c83392", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5486735087132898, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9105454024706665, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9053223069505958, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8895288523105174, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8344068904189542, "ground_truth": 0}, {"key": "61e4747776bd844146a9b8c7c1913c827ffbcd8a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.682573721722953, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.317426242277359, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40168778337483224, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47073660100252845, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156198937204473, "ground_truth": 0}, {"key": "a9854fc40719b0d083a3fd279b6196188228a4e0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3073580059212139, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6959583337798146, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39047582282256516, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5039061838729811, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35398631708362305, "ground_truth": 0}, {"key": "8d37ab9fcd0248c093f6d0e5682782ebdaf5e837", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185081867156, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46490156494407275, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3904758370638488, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4843800975488062, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3960681850004039, "ground_truth": 0}, {"key": "d3199d123dedcdbae55b2e9d1f658717c1d5e233", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708684885351, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.353986306398159, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28776781112213534, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2704802198765864, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974734943092614, "ground_truth": 0}, {"key": "f249ede5a3cafd2506ff2bb400291a7db1c43b76", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3849121251715917, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.348645142672497, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18832396476634242, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40356684903096335, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21206879919577443, "ground_truth": 0}, {"key": "6343a202a70e8c5d3bfa4042bfd087d78ca5805e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11596071611975896, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22678363744291336, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20817891479149, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1393963709119195, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1530421539529296, "ground_truth": 0}, {"key": "da0d41b431367b51fd995573cb498c10b7f64ca0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35042136497911314, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27048020729946354, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7325918386910112, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26133093043843386, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952108072590293, "ground_truth": 0}, {"key": "0620ff5fa324a35b4be54bbd2de49b42bdd0d7c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707365729356859, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42632161618947895, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5660185610450089, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41111087140740815, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307584583831, "ground_truth": 0}, {"key": "f0eb8f9eee266512eb604a51b482833e202531d8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684615379542, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5389832256750278, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32423539997323436, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5698526312749023, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415825058728869, "ground_truth": 0}, {"key": "c8f743307d5d1f7f19f1474d68c9390b22f6d076", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7057850425503014, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6636689364074115, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43398148518780255, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.62977461813545, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631823217055, "ground_truth": 0}, {"key": "5978abfdad91e604840a2dcc993df5ade9448e82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621765054538471, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.45713670946608687, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45907613053439417, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5794004304661751, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35756750922832614, "ground_truth": 0}, {"key": "5bcd4e61b39cc7ffff38ad88cd40afa208b18528", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7264256031761713, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2909808605734193, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35936414936864225, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4455295424835397, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3380771367553729, "ground_truth": 0}, {"key": "44815c184e3013f07781311b30ec5ff009174738", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.361164716495961, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49414089990576154, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6876300030586155, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5175709038114057, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47657963048457996, "ground_truth": 0}, {"key": "d7783bd2bf5ad92156962380342411c2eb068853", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843800785046206, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22541663085600713, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2479874214747305, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33982762934410055, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12336563043103037, "ground_truth": 0}, {"key": "4963edb0ad2703e9f6c54593149d9b81e7ada91f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28298812417470076, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.626124165753368, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3311197113909862, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25832598349449853, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132022195071136, "ground_truth": 0}, {"key": "51b9a2d46dac43952e713874a5769be5ae350626", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206880755559793, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5175708941121601, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30074558767394244, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4320633899137283, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3998116638171999, "ground_truth": 0}, {"key": "d670da295571f998bd0864540e2acd109d077131", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964512750544, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5640984853655792, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3849121540840007, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5234203186576739, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166014571956, "ground_truth": 0}, {"key": "f2f2246150d06734b2fab694a39bd8d693c7d255", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937837984392947, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23792989344047163, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27512972854851947, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14033624220486898, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1634454294149328, "ground_truth": 0}, {"key": "3cc0409612242093f34ea1d8ca1679f434955cff", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102675834241, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31912136851796014, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3720487834307181, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21866938731007554, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368159849543, "ground_truth": 0}, {"key": "a67c4eaf797da7df18a715cd30c6cf11db96c954", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076629879708828, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2735743903192267, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.34510529487881103, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4804786727055529, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256199358424, "ground_truth": 0}, {"key": "58456413c8bd03a8ce70eb0061af07c6a9824fc3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27357440515212134, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.07263670893796932, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10447732355910944, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14318769511915858, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09401018222144893, "ground_truth": 0}, {"key": "da040b67082b56436ccc8479a4e435cbf892a1f2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13206614673749034, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17106117171053356, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10302442303763822, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07369626343270491, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14511536079728585, "ground_truth": 0}, {"key": "c71748bb246a2b05e676862b75b38fa03bf6646e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2160115136348043, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.611381971400555, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8164063927165814, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48828338058234183, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7025300634878056, "ground_truth": 0}, {"key": "800f8dc06596c30444526bf31dd0db7504391a82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6859494469004329, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21076629952124895, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30074559776750126, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2160115333579809, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193278226923313, "ground_truth": 0}, {"key": "3b0ed227dc7e5292e302183282d8bbe23d7b1db2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594719464569878, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3007455635989046, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37204879167776345, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45713671316330134, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792989241251136, "ground_truth": 0}, {"key": "1e713005e16983f75222235967c0cbeb0b944f80", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557748755155251, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5964331561644716, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.859663752654948, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7866228353246688, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736783972458049, "ground_truth": 0}, {"key": "360ae10bc8bd30a2aca7bc6b7000e138af63adb1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9304582540977139, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34687308808409134, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4054487303021108, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6584175105753249, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990157200326, "ground_truth": 0}, {"key": "50e996059a005d15e3e89b5a3c3695309671ed34", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843801167895166, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10669058945920157, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2068940474364736, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2337063598725962, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1634454386411498, "ground_truth": 0}, {"key": "ccc7f6a2139593c47f6b5880f1e3eef9e7a69734", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2751297304975827, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38491212380221995, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3793783708061175, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40356685201758846, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21206881208927184, "ground_truth": 0}, {"key": "f4f90d4ff5af3e3648055673e040f0f43ae076d2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804914822908, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22541661266013224, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14414885306274677, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14318770262752126, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765261720913787, "ground_truth": 0}, {"key": "6c9ec6b9d3e936d2394f74354d577fdfcdd985a3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331422954502, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42059957051048263, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5794003940307653, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30074555157556376, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168781538823023, "ground_truth": 0}, {"key": "438a2046f4465fb1f6dab1cb327ef9ca86a4cc0d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3208213076433102, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.0574932731729829, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2766905272315656, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12336561665476468, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245586361388, "ground_truth": 0}, {"key": "73818f6c987b3604b8bc92c4fb03bc68af196b77", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982762500539193, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13939637595698218, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1766715889222939, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20561504360311594, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076629361237859, "ground_truth": 0}, {"key": "f06d91f46326752b02cdc48e8fa472dcc38a0846", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2365162328731001, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10017222496616421, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18713266846826263, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23231014581048187, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128141927362417, "ground_truth": 0}, {"key": "c54bee6384d58517757ad5a8a30ea6dc59980a07", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937836853128376, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21206880479991824, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11596071685769095, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1755380688653756, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.10894505145862683, "ground_truth": 0}, {"key": "2757ff294ae08e977ed6a2b6e1854210f28f12c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.150028816031111, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23091976261027047, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2583259950524927, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19559408177502308, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076629971038455, "ground_truth": 0}, {"key": "6a004c991c482f664ab8ac78df0bda26860b1c7a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1480471924308022, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44746028529094206, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7549149744940084, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.55832700082169, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4244119899263149, "ground_truth": 0}, {"key": "69159eadf4dcb2b7850f3a4db6454f8209f33e3a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6095241642873352, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8031737892441734, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7122321867070887, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4416729988120205, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307992752705, "ground_truth": 0}, {"key": "c6129a4c1fbd5680f512da18fb60a19a74f4959e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.45907615755330083, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.637030799789591, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4148988187980936, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3557749206090261, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567905284443, "ground_truth": 0}, {"key": "1fe7d16db2c7a742dc1bcf04bfb8e285e7909f03", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33458942674681036, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8140527915833613, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8221891085001659, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7008947882972506, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366135204009, "ground_truth": 0}, {"key": "e0ddf766661004eb3ff337d95e249073410f0755", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269208086987, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2254166356228473, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6206216012068877, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.06705628614311249, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469141162452368, "ground_truth": 0}, {"key": "dd37d70b837b24247e9abafe8fb5bc5fae5de464", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633836685892, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19193280329970777, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18832396975152668, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20817893376331026, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995624107660348, "ground_truth": 0}, {"key": "6e3028e9ae17ab59abc7732fe840468ac9dcb60c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2523840540031551, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.804405937135128, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46684557902408214, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.824461927012408, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990415122383, "ground_truth": 0}, {"key": "24d2f15f65bfb5608c75d19ba07fc410aab4d9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953782344635, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27669054881864125, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2735743910641433, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4225046214933339, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4263215978267631, "ground_truth": 0}, {"key": "698329cc7a8d796d7635bf59d2435aa22c1a38e6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23510836272284794, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5544704678445661, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5983121847077751, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5583270135506146, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.46879061334089, "ground_truth": 0}, {"key": "b531a8ba685e8d461d0a491f35c9970c3dddf3dd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666091329919, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1919327682456536, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25683197909965244, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23792990031182573, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1285251354628306, "ground_truth": 0}, {"key": "5b0e686b4679910743337ce02b36dd71a5caf5eb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08269733720062192, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5869964451046409, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7325918488643957, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40544870483643797, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406865327196, "ground_truth": 0}, {"key": "980e6db610d9882443d61e36d955f02d983d3e76", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6315943254561641, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.697608926684909, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2583260067110388, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3998116361898944, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740216275414, "ground_truth": 0}, {"key": "6c18984d8f30ce196e9399200dd15e373e699267", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2893717144325565, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3575675457751967, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38491214488756476, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3242353851846889, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25982561076910465, "ground_truth": 0}, {"key": "e00f05efe2038fffc8eaa1e8eecbe9445a9483e5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814613334347, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.049589021826815835, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4359015291780784, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1602660254261761, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337717787756416, "ground_truth": 0}, {"key": "9ce109dc50fe4eca8b2d0c926d5dbd1df5f49187", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048018875773905, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44360043302532076, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4186969199139804, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43206337510237136, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2958398596462475, "ground_truth": 0}, {"key": "bbec538b4453859ee9c772c4de8f0eb28acd87c4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165165678579, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24653334125881882, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1847675052744079, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4282334056533666, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4571367136463731, "ground_truth": 0}, {"key": "c4e0587d1b8fcc06c2cc5cfcec42a34d314fbe44", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711345211135, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38861806934821813, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.384912182262374, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3539862760764058, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2643583434620248, "ground_truth": 0}, {"key": "7eaaa5bfe35344ee85eeb871a4d31cd31b12965b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2735744049590396, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4148988436637417, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.771843520967642, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7170118651115449, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36477753605628144, "ground_truth": 0}, {"key": "9cce7373a54faccf5b5d1232c82afab9b29ab6b9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6297746188137293, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8864203941008294, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44167301644023405, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39420096416735545, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544873259230557, "ground_truth": 0}, {"key": "1b37e549bbcec859711e5b2ef310e94deed4dc95", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.675764599819336, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3942009506562441, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5273165153332771, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49023562564190276, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5640984745510588, "ground_truth": 0}, {"key": "da780ee614304d195bde3b7549313c02990d072e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6531269019758942, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.276690519284588, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3293917338018114, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20434188888214894, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22000711156286387, "ground_truth": 0}, {"key": "e24cdc200182d698a34f564ba71f4948ce6760e5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2365162424978016, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29910517732937286, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17667159877845043, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6723317076504689, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943762181921, "ground_truth": 0}, {"key": "42483672c204aebcf7ba6e7d6ca4c628fe9a69e7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3812195708158443, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09268777622980497, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14318767842156582, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14706452349654323, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.08210662278310317, "ground_truth": 0}, {"key": "3501c83d3dab4a2e4d2142522a4bf1510a64422a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.0850990405567292, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41679664010602246, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5869964539202884, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29746996453548064, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658971283685765, "ground_truth": 0}, {"key": "964589248c2d95ac3c734ad71283ca22ae4ecedf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.602061589105953, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4726834798841842, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7386690873244736, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7248702788283915, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6460136799460016, "ground_truth": 0}, {"key": "6b72550a663bcb7a64e242ede6da53b1f585ea71", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743479287787, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15921740503606138, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4186969002264359, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37570644919156876, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16344542820770797, "ground_truth": 0}, {"key": "c96bdfc0463d994ddc858ad358fe59371be79352", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6601723869337619, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33807712465474354, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27669053904522495, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3684057070232653, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25982564071409314, "ground_truth": 0}, {"key": "085dc5d706487da983655043b144952956cb3c5b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118459753765, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.754914975038911, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.694302663778868, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5717665955846076, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5679366242096463, "ground_truth": 0}, {"key": "1c1dc1da2f6ba045478e25e91c8e1b039ce4cc67", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947338664335, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47073660501092435, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2538609949967939, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32594950075989776, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6388352756258141, "ground_truth": 0}, {"key": "da90eb668bfc66a5e70b2e6631a5ec1c9ffb2413", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593552671934, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14608725264052477, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25386100675356127, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17553807355963197, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653334966861123, "ground_truth": 0}, {"key": "717b1934db9eb0d7e5e2aef75cd54b29a6530a59", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2538610170288096, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12852513583923225, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.12168575573550053, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19072403035529903, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091975292921318, "ground_truth": 0}, {"key": "e493fe7f282adb10c6b9af18d41f0181f17341e5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.343341756506494, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3056973566096807, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5214711289411028, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4785288461427458, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238406871051605, "ground_truth": 0}, {"key": "e510fc72b8ef595e45f1a510d0cad761ae1bd032", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4225046192102505, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4687906407014861, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4629586114174302, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4073334071073159, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4707365860067359, "ground_truth": 0}, {"key": "564e02cb944ea00c02f9832ab968441b5c67332e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360042346401873, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28298810869309454, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4707366044227487, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3593641453591469, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910738833326, "ground_truth": 0}, {"key": "dfd0cea6589cb8be40538b9f165781fbc2c7d796", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27669052536539274, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.307357995724551, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.199307986494499, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7994423103988262, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30569733651804715, "ground_truth": 0}, {"key": "dbceded6ea7d8a0944ab3f44263f688f644a5c37", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36658973280651874, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5563995906724286, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8902942161485777, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4960938248584952, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.505859111629508, "ground_truth": 0}, {"key": "305a7272b28da5bc5574487ca0a09f48b852788c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2213506808907886, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2974699281427758, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9462003564198314, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8624675281851725, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2958398800892408, "ground_truth": 0}, {"key": "9814600b03458475607fa2e4e9f1637138b7c9bf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3123699813579869, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.583203358636593, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6424324644072248, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47463117208847877, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6206216290835835, "ground_truth": 0}, {"key": "d16bff688345742ee8a1762cb6b82b49e4a065dd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804787011785538, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8902942232809667, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9755769128600491, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8879840483303113, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8449215224447049, "ground_truth": 0}, {"key": "c85a7eb698c39c7465d1fe4ebbb50447329b5497", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9974291322016277, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5214711772058873, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.472683466525475, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1540575677233976, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4016877938040083, "ground_truth": 0}, {"key": "5f299d74b492be5e53e6bcf3a54d3c8a4b418a97", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398611889167, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38861804027243274, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7704648028261972, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2465333539140262, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.505859088965936, "ground_truth": 0}, {"key": "5a4e46a4e18d31d1ef4d1087b1643a349f10dd14", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4843801067349979, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3225259740988846, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3629691918245145, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5563996046437462, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21866937519386445, "ground_truth": 0}, {"key": "b6b7cbc40f51483708d53416719205f36c06f6df", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.399811610962364, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3522017880520985, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4474602935141903, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8376199744114783, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.370225389708633, "ground_truth": 0}, {"key": "7c0bda3744be6f7d95eef695e59a4e4001455a35", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2798285038940977, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14318770256738966, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6513548584957843, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2893717092763992, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270011132076073, "ground_truth": 0}, {"key": "f19b17438e69527f376e5d9efc74d19fbac6f755", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939172226164937, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3398275987165444, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4843800967011445, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6688802453793903, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3398276042121809, "ground_truth": 0}, {"key": "eb2fe21af9629392d61a4fabe6cad72130525f2f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213481217277, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4843800948894024, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7704648028261972, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6388352949702237, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252598032537166, "ground_truth": 0}, {"key": "eebebdc4fa08a6e927ab958a39d91f888550afec", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218814060716154, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7853085897290201, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7549149662430251, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.569852658335921, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7534666621111727, "ground_truth": 0}, {"key": "94b15ad6efcd6d47dfcc242135be481fceb7f634", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6842640107030803, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44167300207660015, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39047582282256516, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5506073849827492, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23934936406832008, "ground_truth": 0}, {"key": "504ed83e41a6a861927345f7a027ba53ad02237a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331240598115, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.07751766329206074, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.09534947141323455, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.03067579964552882, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09534945617051375, "ground_truth": 0}, {"key": "42176b852f897ae19ef0cf39d598878c8ff0bced", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09138210179821776, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49609380783645624, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1540575688956472, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3073580214719324, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30239106659860604, "ground_truth": 0}, {"key": "62ac534bf7e3e897b2726dddf2b7b6f7723362d4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072403241728242, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20817892746605807, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33633104166165567, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18832399054811688, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651622907469594, "ground_truth": 0}, {"key": "4ff05ae8454ad482f81911c5e4275b63466bea35", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014013863307, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2845760101645294, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3363310516630647, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4455295272384748, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31742627428525977, "ground_truth": 0}, {"key": "16e86dc5e3fe27875ee927741542536ea7b7553b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541661347919506, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39981162576752743, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3415824773527372, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3007455701464093, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252597012223894, "ground_truth": 0}, {"key": "ad55d2f13db6732edcd716e09f527ed2df39946f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33111974480536344, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6388353017704295, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6187804235812222, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18242552711308713, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2861692349321933, "ground_truth": 0}, {"key": "160228fe18f272761b969b08622ba868ad65b206", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668455874332702, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5736783920973825, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6706083090944678, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7577943504622419, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5370413901066596, "ground_truth": 0}, {"key": "7ebb75bc91aa51d53b06fdbed7feb52d42612065", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.585101128951747, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6279512004209856, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5563995647589842, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24364243005506714, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6601723992091101, "ground_truth": 0}, {"key": "a84e31bf36290e557a3080ad297177b6f18cdf84", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804686033127443, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5136684577599444, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42823340444003083, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4532618494665367, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45132651999519285, "ground_truth": 0}, {"key": "c43c7253f38ff2cd79770034ed9af3567cfaa811", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39981163722374785, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3486451515332017, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5563996005109483, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4054487396232195, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3647775840414015, "ground_truth": 0}, {"key": "a4601415eafb5264a4bdc273de3a16365aefb35b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35756750482455363, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5544704858992946, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4532618630230259, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37937838268986795, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.613236551101414, "ground_truth": 0}, {"key": "91d43f137b3d928561fb62b200ae40aee4a34b73", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717665895893124, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3363310675707191, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20561502381291571, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38491215824937774, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2893717132858995, "ground_truth": 0}, {"key": "ab2d99eedfd685ce685fa44e735695c27e946683", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668455892919241, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.45132652422043107, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2893717052455667, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3140505596363957, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864515059129486, "ground_truth": 0}, {"key": "df9c4e1b8698581720b28c71f1e98f82bd6ea6e6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953522205169577, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4980468821561555, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3539862601228595, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5409238869401206, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33982761677880524, "ground_truth": 0}, {"key": "a1d7a119707506100920e1a6f0d9cbf4d4e7c838", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3208212971191185, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20689404195152536, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40733340477899826, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1980641627841756, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2043419145969907, "ground_truth": 0}, {"key": "acd2b851b367bf62dd603ebff5670ffa9c853a8f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421498390985357, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11047115506981015, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1015894416483922, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.06656919758688175, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09739039407867287, "ground_truth": 0}, {"key": "b9f5a02386adb698ae71cadd3fd1825fa7b998db", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18476750826366506, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14706451221474992, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3311197574558095, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07640767787721105, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09334687218903591, "ground_truth": 0}, {"key": "c26f356dc536e5797ba550be6e27a95059f1ce53", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12678517585884055, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2628418270998993, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27982847923069437, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1968262197464338, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495229922296, "ground_truth": 0}, {"key": "94a9883a283e94c3ad53069d98517b08e8853447", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35042138068844586, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.656658277201622, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7772998731534448, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6740504978995246, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2974699632642963, "ground_truth": 0}, {"key": "9c02ebeda5d84859eb36070de7e8a9517ac3fee6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984978726988, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4960938282004817, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48633152893882176, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8344068980872063, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3433417494313408, "ground_truth": 0}, {"key": "37ab3a49bb7732e145a24e70e6f077469ca1dbd3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583270121664847, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38861801082828845, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18594718449636502, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13206616457967446, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36477753006937347, "ground_truth": 0}, {"key": "fa67b52d4597e227947776fd40a4b16f402ed12d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49609385335816647, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3886180297378507, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3451052771925687, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25683199578405685, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.350421398223107, "ground_truth": 0}, {"key": "cafb6a9801a85984042abcd7e552d1e129dff4cf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203601328586, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6460137162139368, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4244120015126366, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41300356888314466, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "12a24b1aba082a5fd0687a14015e1e58090ed9c6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2766905368473033, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6513548555882288, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8300437699372186, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.724870242809105, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494239642079, "ground_truth": 0}, {"key": "c8ebf6f48257a704202c7b6df238bc1cbfa838d7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666530660435, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1250653875926069, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.08389038155106933, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12336562203669663, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740816373760995, "ground_truth": 0}, {"key": "48e858dcb8dd62aad328f2c5f7fa052893d7304b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12252321947784968, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5292633913654315, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48633155876485434, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5964331516981478, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6706083034036183, "ground_truth": 0}, {"key": "1522da440cb538c8fc60f254efcb65e8378065a1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5467381521313889, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6279512201975818, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7676898653306694, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582677374537, "ground_truth": 0}, {"key": "0b40c6061cfd6a745886150c46eb75a7f43b4efa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46101677150193193, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2751297152434967, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1276526293226084, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.430147358792051, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733753032652994, "ground_truth": 0}, {"key": "730655d5d1f29496344388805a891c3e3fd2a64e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28140560154990496, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3593641464538471, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.41300357489685724, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3363310366125216, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2766905269152696, "ground_truth": 0}, {"key": "399877dd5e90d151e29ad67fdeb6fa093632e0e1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43398146889688693, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18594717998417765, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2479874214747305, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2568319758125872, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238404447712015, "ground_truth": 0}, {"key": "67fc9fa49a2c443dcbab030b9c6247a662716bc9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4687906100970538, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2958398769782534, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17328819742974805, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21076629757889337, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.07211220564918713, "ground_truth": 0}, {"key": "8a44f223fc67ed0d5f946517f77c2291d6c4a027", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30404166298333085, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3757064553171698, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48438007905656183, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4863315246920191, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643639865098, "ground_truth": 0}, {"key": "a3906e4f27942e2742d5cc9a3241980e338e0d30", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.461016786740064, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8670357667598154, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.488283382698349, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7634837613865926, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419747044136, "ground_truth": 0}, {"key": "1e9f089602e8ab42ae65e273d866b53bdf9501bc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7981867897057564, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1294027299343516, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16026603307649098, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11436852599475768, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974734951638245, "ground_truth": 0}, {"key": "768682d2f556e103bad77ad7aaa0660181747d1c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707366163365632, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19930797948570553, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8910549485690863, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2523840348551958, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2720245343664107, "ground_truth": 0}, {"key": "2806f716e41ce224a3862eb2bc50e214bc5037d8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27357437509699617, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5736784358971899, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6150878660872553, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.445529523223178, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292634181249877, "ground_truth": 0}, {"key": "49d1a193a2c477f5861b593f06681b35b0e49573", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056140036731, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.531209381998886, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40544876445597616, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6001883607046626, "ground_truth": 0}, {"key": "d603649af5260edbbe0474bcbb2e83e7340372d3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370307876970924, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10087861166720619, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1895210852035155, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27512973259156165, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13386749192019137, "ground_truth": 0}, {"key": "241c3bfcde3e19fb8f0e5d0273ccb06155a2d86b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26588046749709904, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4804786720544584, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6992544104012044, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.668880247937761, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7606506598175449, "ground_truth": 0}, {"key": "cc8898d831bb770da703c284d4a811f16cb4035b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601556631546, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5774953555991649, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5774953482382893, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.598312163697792, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802545592735, "ground_truth": 0}, {"key": "e5685719d330bf84ed7691a9a591e04e6a6226b8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8198933125124479, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5544704648131628, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.602061602580734, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5794004131730642, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37387580956176136, "ground_truth": 0}, {"key": "bc868bcd37d2463875c4c685c582449069992a76", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3380771349100997, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.08509904414141578, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.07159119877789033, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6242935305559373, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.08269733797145663, "ground_truth": 0}, {"key": "c6369011986d295ce197e7304e14b207dab4c0aa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11124121232446288, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.05419873057870466, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4016877986139429, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.08210662540793802, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1403362574977103, "ground_truth": 0}, {"key": "c4e4f565d15f76b1e367d4fc2e7a2648c3cd395c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076629751828702, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2766905213125853, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5078118552546772, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4493926243521721, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.46101679388050965, "ground_truth": 0}, {"key": "32fe9f0f2eedaf63c9fd0314ab92c4b46297e260", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7534666529002598, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3702253766371196, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5389832223487622, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44167296735662376, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035578597945, "ground_truth": 0}, {"key": "41698f361bcf6415f711719ed0c2f6817205c091", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684579394175, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2173375173940605, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2735743837810272, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24944723076016698, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5736784066513362, "ground_truth": 0}, {"key": "f040d657ee146cd131d34aeb31d6728b4f996666", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2861692427877785, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7704647874494679, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49414092212333305, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7106283375545921, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398143291416874, "ground_truth": 0}, {"key": "1823e1e750046606e4be0e8710f1d74998783e41", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7090191421754571, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33285231689170625, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3242353859175016, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6513548739545096, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1634454353812983, "ground_truth": 0}, {"key": "6fae638166ee95509fbab3b28ac1c0ba0b088c79", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3157359788863288, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25238403939871024, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8116760095215081, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33285231665386555, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059959887520293, "ground_truth": 0}, {"key": "00be40289d0aea65afd2da6431db8a9fc8efc9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18832398341995368, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23934934740103536, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6334102583465966, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38676344906504373, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743682860813, "ground_truth": 0}, {"key": "50dc0ca6cbbd4f9c3761fbb3ad9e7d7ba85bd9b3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27357439049271187, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3849121356053363, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9161096048212904, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5525397186201886, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.38861801851794764, "ground_truth": 0}, {"key": "28b0e5240a7c3088fc62a70628b146bb40b6b853", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238649529543, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6297746235185548, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5467381567257465, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48828339009851024, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7690802511524835, "ground_truth": 0}, {"key": "44bdf9aa9712197110017fca533785653210f1ea", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4035668471988055, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7563575369299299, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5794004270215347, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40544873219597527, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6926419799179958, "ground_truth": 0}, {"key": "879e68a2b78b3cf3f5c2581bbf6093871143ed7b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6943026493941727, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.513668483619605, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7634837423635897, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5755879885056657, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019530857570834, "ground_truth": 0}, {"key": "980051ddbf137ec06e7aeead2acb598bae388520", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6992544177568769, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1267851836426405, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28298811346205094, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6150878688302517, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358595920395, "ground_truth": 0}, {"key": "45b9fb89ac2724f2d7de56b2f8c9397bca03326e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6187804512458198, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15921741874239378, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47073661442960124, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22000709173588862, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32939169136872837, "ground_truth": 0}, {"key": "b427165e1be5e9b6e6067fc5f6591c02bfb93333", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845760049380057, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1955941035610523, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14128141402586608, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31405052564025215, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19314738635488443, "ground_truth": 0}, {"key": "a9a2880bd65c6b3835d19987ebcbd3d09010a0c3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16026604485438214, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21733752775895984, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3849121818798447, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3225259723513428, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717665882210722, "ground_truth": 0}, {"key": "0c67e8d5a91f3c7d9c53e29b8d0a25cf8db21b54", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894304640403, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5813031231549357, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9105453969197631, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6424325150185479, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6723317043957837, "ground_truth": 0}, {"key": "bc1c4d12aabdcecab3d87c6f9a898e41c7cd3821", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689396186974, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49804692856420774, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5774954075301645, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5331544123271345, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3904758364157466, "ground_truth": 0}, {"key": "7b76a0b5e6006587b65ad70ac2e4953ca1e2d4d1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982760512887433, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18359361671237404, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3259494973909677, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6224593251803132, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668455928928741, "ground_truth": 0}, {"key": "8a0976b5b0811c919669e8aed7274e1d0fa14679", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1480471975002864, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31405051329996103, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37754066317712226, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17895589372824713, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19806415832282886, "ground_truth": 0}, {"key": "69788d586d71bf36d2818ca097308747f6ab25ab", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544237547761, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38121956533181983, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.569852642922379, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3611647232837148, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937839698957854, "ground_truth": 0}, {"key": "82e9c77478dfed129ceca1a152ba54e20f7f5a88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3056973449774946, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3886180077923552, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39981164143618725, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5058590773586579, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238403994843056, "ground_truth": 0}, {"key": "e1b904fd0a3f74c3e01831acb6d4a67c0d1b642b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38306417196014736, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4148988380039138, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27669052652240556, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3849121420814068, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3665897452518312, "ground_truth": 0}, {"key": "1cecb5f24805afcc15eb5cfa0500130f107c8bcb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2240554454467254, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36658973230476755, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4843800970850151, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4493926389284962, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3665897082866631, "ground_truth": 0}, {"key": "d3da69405b687367de6260d74db8726423b6884a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41489886850221597, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.602061594498252, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5621764893440548, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8187367824264719, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203493344255, "ground_truth": 0}, {"key": "9b7836ba179053fecec671168589694bd4ba08f1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990542361569, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9860442885199938, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9681411463539135, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9683812336330208, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9529258255834686, "ground_truth": 0}, {"key": "9483ae6d83dd71a96e91eee727a9ce7c0f3cf6ab", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9525741353044952, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11920291903511561, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3738758358999858, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1460872513398328, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18359361519025075, "ground_truth": 0}, {"key": "ea29e498c303964fc39c856ddf7037d5dfbc93fb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991052022615181, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5234203218945338, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3468730762340629, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.182425518519059, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.47463115669312866, "ground_truth": 0}, {"key": "e1aad9da59a32a4443010b092eba1b68725c8467", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3276683031002733, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22815649061959087, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29746995029544937, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15921740076953203, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213886333703, "ground_truth": 0}, {"key": "6897f34c8e510dc95524dbfceefe20717776f761", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953520750896292, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6169358177047334, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46295860360552, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4590761311015252, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180176519855, "ground_truth": 0}, {"key": "c0846f0148c9fd60433c8d2bf85e3437b49f9ec4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46879060269719114, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.760650656132355, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.611381953098745, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5907792319127342, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6150878497690776, "ground_truth": 0}, {"key": "dfbb5a2d5844f89537141a2b5a48040e68327010", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7416740359196085, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2295351777915501, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1403362446307546, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20689405717986464, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19314737127618314, "ground_truth": 0}, {"key": "0aa0562353120d93357dc00a05ff4d2bc0312715", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16885696188354452, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24653334702036353, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11596071078141014, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13939638241320884, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.10669058946710705, "ground_truth": 0}, {"key": "fd5ae29a3ed2e9093c12dcbb12fcb5c67217b0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5621764961073219, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5679366041926939, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48438008429688734, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4301473328037136, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526435863613, "ground_truth": 0}, {"key": "4df7a53f5e24347a53d5bf3b8c92bef21561f2c4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883677808346, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15203222960376153, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2893716951016461, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14223188224962505, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09670579435070403, "ground_truth": 0}, {"key": "166fe0c3d3f400a48ec5fd716c675384512f152c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594719083170094, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7772998590576516, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4843800606929061, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32082131557450594, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7799928977352745, "ground_truth": 0}, {"key": "69e313e0e6e7603f96a3783cb7d1ada68ace288f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984745924578, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5794004162692367, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35220174947273797, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6791786981713794, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5602526402452942, "ground_truth": 0}, {"key": "21ff7b91537b3ab2e73dff1f982a669b8658b0e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358583186186, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5794003904623283, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6706082868480937, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6020615705945003, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8376199411158752, "ground_truth": 0}, {"key": "963cbc7820b42eaa7b7a82d178c6a387a70a6a3c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8766343715928122, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9597620624161818, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8376199799670998, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9799765572798037, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9381240142095371, "ground_truth": 0}, {"key": "8180a77657661e975e3fac6c7fdbd8de97fd160e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056035308551, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7041601287609641, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3468731090850086, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.210766311178346, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22678363121687742, "ground_truth": 0}, {"key": "6c498fd6de7ad5e5006732655050c1d97cc2af68", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.06754669434618721, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2613309215466072, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23370635027436373, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18952110157480068, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398145563903023, "ground_truth": 0}, {"key": "fdb54e157f8f4e5a479dbc6288587e52fffde33f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19930798996360768, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8267117871438006, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.287767820844051, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3757064842247855, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6959583215701532, "ground_truth": 0}, {"key": "fc8f0e54e2627ebe705735f0565d77ca64579d92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293917186331979, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13753246957782633, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2094696868168945, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40168780077238536, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17106119264379996, "ground_truth": 0}, {"key": "b000d4eac990440e136dc1e655a03d5669531d9b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28776778602238823, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4436004244763144, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18594719928318396, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1883239866573786, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1968262189338924, "ground_truth": 0}, {"key": "1064c47f3d7f0efa03368fe7eb01dd0836017339", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25534363662474385, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47463117009085054, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4649015945058868, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5097643862244061, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591061774734, "ground_truth": 0}, {"key": "d79f1e9a2ddfcb61d80c944de53daebd4b5c7f6e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6460136902139876, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3007455836112025, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.12336562160821161, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2766905390155977, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20946967769558464, "ground_truth": 0}, {"key": "87b5f1f872c849ec239bad4ccf487d048d4274b2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616924253683856, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14511536045977397, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4765796622636868, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2309197651663405, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27825678309535296, "ground_truth": 0}, {"key": "9ea6d6a5cae86243c1c8899f7bab76e874c73b38", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508502876135327, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2120687916586079, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47073661647265264, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39606816686465207, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3504213955219065, "ground_truth": 0}, {"key": "a3cb529364dbdcd2af9e30ecfe56898be375870b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46295861681620276, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7648916023675741, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5983121927108392, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8519527915417282, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754544655576, "ground_truth": 0}, {"key": "f489b07406c653968a0ed21c00e28c9124e4a49b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5234203179904805, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3923368092179219, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3539862601228595, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7371581718947461, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41300356520615944, "ground_truth": 0}, {"key": "499fdb9bf024f6fbfd605792594372df22ec12f0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4016877947138386, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42823339889264955, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4225046332668465, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40544874351658555, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5467381576318793, "ground_truth": 0}, {"key": "9f49bf7ded4308f1601e4723d594d7c3b4883b32", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880270924452, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5156199227251916, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.494140897491361, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6976089038878361, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6976089153549887, "ground_truth": 0}, {"key": "6bd843fe975d42b0f2d5eedb1a02d918e4a397f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935332399098, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6334102629421486, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7839884630382873, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6113819659423806, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526567203078, "ground_truth": 0}, {"key": "00aa8e3ba59f5fe71a096a5549f80faece10aa83", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370414013425631, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13846178825823613, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17328820664615585, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3433417161804639, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220177187742646, "ground_truth": 0}, {"key": "bf0ea0373655184f69fb01b9aa833d21e7188e9e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344543024888067, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.66192287978208, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7106283125901046, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5448014006485811, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7401743695388264, "ground_truth": 0}, {"key": "e1afe080ecf3565b0103214c21f49e8b03741024", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593413775442, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2974699276456891, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32939170632461956, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6169358404389955, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45326184303676825, "ground_truth": 0}, {"key": "05fa6152f08a3d64745030124428775768ee3afd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755879819721257, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17895587614689326, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2267836380234832, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5292633780042255, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3073580374817309, "ground_truth": 0}, {"key": "8f80054060e5c2dde57666b5e3bddf6b70b34f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3191213863271725, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5794004111940954, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3106943534370152, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5717665888851147, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203499789296, "ground_truth": 0}, {"key": "f63877ffefceaf9a2a13a9277f4d861f9b9b8a73", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711645851473, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38676345960461167, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40733339270417634, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24077459564743614, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666001661177, "ground_truth": 0}, {"key": "e1e0fbee1f5df559fda3830710afb660f33cb7b5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783893453079, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10230471231175409, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13477591084690665, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2538610111112603, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191214057895184, "ground_truth": 0}, {"key": "7d66246dc75062c5616067bbb379962c3934e52f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12168575616942713, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4455295069615224, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6001883310314372, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4824291131627742, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711719966444, "ground_truth": 0}, {"key": "09e62b334425ef4eee26be483a625858c91340eb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5136684584603985, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22815648010590417, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29421495440094136, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2146914296673902, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13568954663658256, "ground_truth": 0}, {"key": "32e769b0ced3ffbf79f695af69a2401897156c8c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17441027784657417, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34334175233341646, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13660838383413154, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5698526625146682, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3468730624180867, "ground_truth": 0}, {"key": "43d42fe40ada4406377bc3b45c123a75552c21a0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.07921032164055469, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17895587975655508, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18242552348851315, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14033624672220718, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1023047082759096, "ground_truth": 0}, {"key": "cec3e977a612e1481913d63934cfe578b9bcf3be", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10894504627529748, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5486735108450522, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.525368827536003, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.295839861239289, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6584174802589434, "ground_truth": 0}, {"key": "2572185d9544f23c4ad02aeac1ae8ab7828fb4be", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7549149773059362, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.04272219832135053, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42823342643990137, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.06804042356389622, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.051845466654872385, "ground_truth": 0}, {"key": "3cc7c9639fb87922cfac315fbb55641e671a3d99", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.06142403616032252, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49218810380971256, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4746311835843499, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45713671507533227, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3886180314318598, "ground_truth": 0}, {"key": "374ae10f9cbb0719c889321f880a0671892336e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804689889325837, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5214711636781603, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6876300012735987, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.875786997428381, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5136684806895936, "ground_truth": 0}, {"key": "89a7bb5a0b120c5b50e9145c8f8f9bea3a90371a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819533025191, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6566582681537633, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7772998609983282, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49414086542698166, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495785889664506, "ground_truth": 0}, {"key": "49d4ad731a44b7576e3e3271b1eee2f0219883c2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6791787046467269, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4186969049831133, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3684056772471951, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21337717470134937, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404166600430765, "ground_truth": 0}, {"key": "ab3c9bac8bcfef89da719c4aba8ea4eee71e4daf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398630085726246, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21601151351246373, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30735801155731823, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23370636562091499, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092208211554543, "ground_truth": 0}, {"key": "eb8b1cf7cf4ab7ad23ef6094cfe69348563aecc8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953522011990216, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1755380805642819, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1645164512286094, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.08389038075594084, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516222942685311, "ground_truth": 0}, {"key": "e944a5cbd4265e43f422c172b930a60b7de190cc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569730974146914, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3793783757988122, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5428632671319076, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.264358334575505, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553806772470107, "ground_truth": 0}, {"key": "ef96a6c54daaf4fef676a69305e26fa1d4788bdd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2523840550565068, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23231016067358878, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3867634267483012, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25982563518219637, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24364245187304762, "ground_truth": 0}, {"key": "d9ec8c3e50de1d5af4524c26c6819e17b64090aa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29098087224289615, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22270015839999108, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.34510529051766564, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45326187264884216, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3684056860166693, "ground_truth": 0}, {"key": "b6072611b97e8c19ba2d7e0dfce153f046dd629d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14414884363060723, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48438007053303506, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36477754935240214, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34687308805751915, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522017988364799, "ground_truth": 0}, {"key": "2cf81cee664ebcb027a48259e34e512a79aceecb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064526088952, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6531268985554696, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6876300012735987, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9840936090666991, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7490872129114715, "ground_truth": 0}, {"key": "b037b44fc06a2d89d95dc7b4453b87371a34fe2f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832050975722, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6076631668825602, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30074558767394244, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4765796688427387, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252598154729323, "ground_truth": 0}, {"key": "b1ea881f21e2b58e247b5894d4f259cf86b4d1dd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2200070830741005, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7233094644390449, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9695556503344426, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9600626863840822, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8469578395411543, "ground_truth": 0}, {"key": "d80e6a3be826df05df00a87f49cc426fd597f085", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9863631658665177, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6688802515952893, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5214711514694502, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5467381594114306, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.507811885566818, "ground_truth": 0}, {"key": "05216d3837745866d393f0e07be7ba801dc330f6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.558327014243205, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20817891880299347, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1008786283535198, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2798284932007532, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3923368259125249, "ground_truth": 0}, {"key": "a204e3551445183cf53ae355e532a2db731c0c30", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939170654451205, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5136684830301637, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8116760258664728, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7154239896314654, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837901516726, "ground_truth": 0}, {"key": "047e7bc4c7ea5f7df08d4efc443ac8a3479649f1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825938591966, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.40922079819318613, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7690802371404659, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5679366066462361, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837697637303, "ground_truth": 0}, {"key": "dee467e11f253e70ec843c45fb373da06eace6be", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6370308001661611, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4073333945782591, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3056973279348365, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15713686068447796, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2379298659997601, "ground_truth": 0}, {"key": "054891b9199a73152564cc5be925250ea282bb00", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09602549584972819, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30569732520625753, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22815651342696605, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2674081672760994, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37387578250546194, "ground_truth": 0}, {"key": "82a94cf607660eb67aac057e3f5028c4cae75abf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984684773018, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3867634472668013, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8807970672739408, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6057990538384986, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5234203391616943, "ground_truth": 0}, {"key": "58bf14c936eb7e9a6561599014fefd77ef6c457e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238912892121, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1329642456363214, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4186969038882371, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15507847012658416, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13206616992752218, "ground_truth": 0}, {"key": "5574fe023e3127f0c206ac89eb06abf5a7400438", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09602548072314392, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11436852106703776, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42823338770461744, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07585818483923344, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930799745859104, "ground_truth": 0}, {"key": "e88be1fa30cb6557d422788b5c469b7ba7ca8bfc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594954558635636, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.08210662721070322, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17106117781161684, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12085323178676566, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510837168487822, "ground_truth": 0}, {"key": "62f05476ec5198ceb345ce4f45d7d0e70f499ad7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19436780968878764, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5273165554972963, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5945512663779756, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48047868282877954, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058590965786286, "ground_truth": 0}, {"key": "8cc719f761556a81a71c2dd1b703749c2059df10", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159390096646, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35756755121071215, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7090191308576465, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34864512215774435, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7279754663969189, "ground_truth": 0}, {"key": "2d89b0d0827a0a1e9e855de7717407cdff63b1f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28937171246071824, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15921742370030229, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14511537425730317, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17781087092491454, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3849121308771285, "ground_truth": 0}, {"key": "41431356e1e7c6f94057b262cd284987f9edb184", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28616925401236487, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4186968993884799, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27982848543207955, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1384617926403426, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29910519827570825, "ground_truth": 0}, {"key": "50872fa30632af8f4c65fb9f952ea8e1b13043c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2782567816729796, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31912139218173297, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2658804628602686, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2005576749350084, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27982847630213564, "ground_truth": 0}, {"key": "4a403faad8116c40f4cb960d3ffad081106341ad", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15713685698857477, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6531269378244942, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13206615675681263, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.482429127604375, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123700046516203, "ground_truth": 0}, {"key": "6f6964470c122807573653173b45b8e00bb59696", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30902370743591673, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3757064668323577, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3007455715242554, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39606816080084123, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894426209636, "ground_truth": 0}, {"key": "75c6e27a38b72bb9f75fa2b8e45e933bae10dac5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3276683042569725, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.616935833312946, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32082129493068434, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24364244986630418, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33111974268192124, "ground_truth": 0}, {"key": "9aa6463127d1efcba4403a185b29849a3688db8d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32766827484448835, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2782568010185064, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22000710863098935, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4320633997356871, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5312094151232706, "ground_truth": 0}, {"key": "97eda06b374f07cd9495962465775bde7d44da31", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180135048793, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14318769446888494, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17895588629440135, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17217184529471763, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3023910950698122, "ground_truth": 0}, {"key": "99a6049d67c1cee35f9703ccb8e6f62a4928295a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2583259879634771, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1699562313099712, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.07921032058275097, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27048023288821443, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1623800279040395, "ground_truth": 0}, {"key": "adcb3e7b4bef0f9efe7a838b56131ca99b587743", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16132024495763622, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4629586240420974, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.411110866170368, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42441203381743114, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168780271555315, "ground_truth": 0}, {"key": "bf7cc4e7872b7471a8ef858b8aa45eca090171da", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337717536535797, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6859494755393116, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27202455461002534, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.36658975065103505, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6992544276172818, "ground_truth": 0}, {"key": "62785b99e4007fad95ce55d427046e14aef476a4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4513265228505729, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23510839730343364, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2689414155682686, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29910516665293935, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30902372008035894, "ground_truth": 0}, {"key": "62fcd4ca096a182c292ae3609444bbc7af15eab6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783503935713, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4765796682174354, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7994423064990532, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4980468698764546, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2240554422552867, "ground_truth": 0}, {"key": "afdbd1bc7c79a936601b3c6cae4622464641d3a5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3593641477023441, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5583270075830769, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7138307454017743, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6315942800923757, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7090191514968746, "ground_truth": 0}, {"key": "2a2a0fd7b85ec6f9145761795bae420d7eb84f44", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5078118717728914, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42441199296763227, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3259495013368767, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4320633875552796, "ground_truth": 0}, {"key": "f3d07208d0059d738fc7788a4ce813309b677d7b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643577408488, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3363310587385556, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27048022171025293, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5058590820847462, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.334589430837974, "ground_truth": 0}, {"key": "2b8840981769a4a8f93d2e82e609ab169165cd3c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3311197230330366, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1441488613520697, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26435835365152577, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12678517525141558, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541662656120487, "ground_truth": 0}, {"key": "4b23ce1db7253bf118b493c9bea7d6899012cc88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076632565468043, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4092208208569827, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.41869690212416866, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21076628559877075, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37204878856525586, "ground_truth": 0}, {"key": "c220780a60f76cdd1f6fd9a84abac736c3ee8ace", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331562412343, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28140561440485695, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16451644930864434, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.06325051813788718, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16451644356382356, "ground_truth": 0}, {"key": "9c7687a36469fc0e2203edb31f303274a611fb12", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16667540223742439, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6242935202574547, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5736783894463136, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5640984841314568, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28140563272066776, "ground_truth": 0}, {"key": "8ab7fe3b19bb45c977cb74ed675579a20611ad9b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468796804622, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21206881533568392, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10302442916943161, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1375324573401765, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12002562142085671, "ground_truth": 0}, {"key": "dfedf6786976733d8e33e7848ea8a7aa735bbcab", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594950360408853, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26133092542633607, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14706450826154432, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2766905034421788, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091975601256903, "ground_truth": 0}, {"key": "825f58580dd78cdcc7fbc10a00807e043c7b4468", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22270013260579832, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2568320051094162, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3867634267483012, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2056150364736242, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09739039783857793, "ground_truth": 0}, {"key": "8bd6dc9f3ebb23fe20f74c1956184064b5b95509", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10302443393124057, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6992544242063172, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6825737331753041, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6601724056839396, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6654105466566145, "ground_truth": 0}, {"key": "a7f6d4487a3ba7c4fc29e9b410820891f4c4f086", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6242935426247265, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19806417063533985, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3276682951672588, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3398276325176952, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091975968254302, "ground_truth": 0}, {"key": "b27ad09982665477dacdb7d06a33134bf064dd8d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22405543691984567, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28616924237536995, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.379378386095685, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16344543641008547, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30735803188023403, "ground_truth": 0}, {"key": "905891c3a21e76ad63d63dfe55e569a4cab25583", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220564754936982, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26435832212750876, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24653335111594593, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.46879065275795373, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11436852731253419, "ground_truth": 0}, {"key": "626460b8ec58252c82ff5513aa754190332780aa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.304041698397666, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6619229044138969, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8397339826552203, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9637799425298107, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935130728666, "ground_truth": 0}, {"key": "31d0ed7b1b8f65c6479fb35683d72de21d70796a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575532137956, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5117165976962862, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36658973626383967, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41489883196442723, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013766143179, "ground_truth": 0}, {"key": "b03ee4df6492038d0a1d99a1717d8ad8ccc06db3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4073334037731185, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6020615753290788, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8479677667396885, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.773216368347849, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.596433162328238, "ground_truth": 0}, {"key": "ad9abc78fb2de88267b854f2aed110e2a5b8c3f1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41679663100963665, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2365162178360769, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3259494932699873, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.529263402251745, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.332852314456676, "ground_truth": 0}, {"key": "75cc16a7ba1970ba791da4ba43e6220f37f47697", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220563506313972, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1677633494404096, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20055768120528117, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2845760021258409, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1789558831513756, "ground_truth": 0}, {"key": "fe9d63d0ed719a42735cadaf10e76416545f680c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.258325992112165, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17781086594278722, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28776781470893237, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3345894364433169, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11436852944482882, "ground_truth": 0}, {"key": "1744093a3fea8b8de0777b1a228c3ba3e515d48e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20181322566951934, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4493926735079878, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3007455701251028, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3867634434065988, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647254065827, "ground_truth": 0}, {"key": "4929479f70e89deb22539e7d2caa6c33bbb0a14f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035497668794, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42250462879595724, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.684264022914841, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5409238575260524, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5964331384660567, "ground_truth": 0}, {"key": "4dd3bb1fe7a5b0d42f0df8d9e62b81c673475420", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38861805762728907, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.490235585642359, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5736783894463136, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4785288367201688, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.355774909170389, "ground_truth": 0}, {"key": "32f0c7b0845e88c7ff34bb9d358a86e029dc2261", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468796804622, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3242353953031989, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4186968963516547, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2509127996784271, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609384183977556, "ground_truth": 0}, {"key": "607ce3caeeac56d7c4250aaa161871535cd1251e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5273165273441536, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20181321547408582, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27982851158422173, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24798742262183124, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074556485073317, "ground_truth": 0}, {"key": "7fb19f75d5d3feefeababf62d2ac91bf684a8038", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864513230424693, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13753246158184915, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.09807930676690381, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1778108723483055, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1789558892685121, "ground_truth": 0}, {"key": "4a70f83728ee66801be719df00060cda4c25817f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14223189448800877, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41869688900053564, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5156199353924189, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6477982161989263, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "dcfc0e6ff732124026991e89d50727876f50351f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6548947306943854, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9990302480522895, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9995326519196357, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9992930943178331, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9989474315212895, "ground_truth": 0}, {"key": "ace7f6d9e984397bda16bf441019f1584f036b2a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.999363808741637, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.06804041965790629, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.12002562837606554, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2146914128214323, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09203286968565848, "ground_truth": 0}, {"key": "6f12c9d47e70bfa86d72685d018ddd1161157e8e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1276526296174203, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27669054697219464, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22135069189592627, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.304041681178561, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49804686407664545, "ground_truth": 0}, {"key": "b32b72e5cf9e133e5be33eccbb2dc9ab5578ae84", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559408950119697, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5813030916519808, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7839884625362177, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8489721981866559, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307751572357, "ground_truth": 0}, {"key": "0ae5e35dc2844afc251d082d8d5ef4be8edce58c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7853085888804217, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24944724545291, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25982563896211064, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2861692452716788, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1451153681720567, "ground_truth": 0}, {"key": "ffb817ce85d7c19720ebbf0b43b01d0da61e9c06", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370634120318756, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3979384238773139, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3225259820445721, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2583259778347139, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815651078938157, "ground_truth": 0}, {"key": "9bfd6a5beb4e8dec59ba6d805dc9349a401da51d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3647775811300594, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7431680045385275, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5640984756258306, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5869964250095688, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.571766606975961, "ground_truth": 0}, {"key": "dc7f4527bf654918c7a4bb19179949ecd5982c0f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7563575766574844, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.06512754537998912, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.06656918469703159, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21337717932941352, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.062331035774463875, "ground_truth": 0}, {"key": "c60e77736087bc85b372a28b4724aae6dcf0b052", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.07423136605715909, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3242354143207739, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15102780908819205, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31405051541422124, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1127954055655615, "ground_truth": 0}, {"key": "e0953e2de7cf286ac1d87a41c62e37f21b7c7564", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269947165054, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.07921032396425812, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18010666638204878, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6020615796469118, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17895587342902627, "ground_truth": 0}, {"key": "8b6f228661fd5f3170dc2c2e6b353e1d6c3859ec", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1847675257672138, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33982763110396336, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2523840333057166, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6859494742976843, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1571368581040114, "ground_truth": 0}, {"key": "2f482e021caf07e2f07baf111c36d1587758f188", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3157359684409612, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30735801798684, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3208212797882232, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45326183725603675, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.329391727788039, "ground_truth": 0}, {"key": "dc8ce4207b91a323bf6e2fbab889efeed22aa428", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966299876954, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.45326186627939763, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5945512860735299, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6297745896164492, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633884887522, "ground_truth": 0}, {"key": "22a9005fe99c5dd536a4f41de4eb59d4f633ef9e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8104789178216483, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1919327687880058, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4111108835125654, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4649015593154777, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2295352186031767, "ground_truth": 0}, {"key": "1b00b2d2edef396855ad392f08a6e74550af569b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30902369097611165, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37937836583416773, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39047585796452816, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16451646622486898, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14223189467145533, "ground_truth": 0}, {"key": "9b43472077873c45e7f278418885ad028eb993e3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11047114622409145, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5253688037541492, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.668880267987173, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5832033411495822, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.370225424094009, "ground_truth": 0}, {"key": "281347d0e99bc099d6991a6a60e30dc13d558216", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186968947699854, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3040416986913748, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1666754124803774, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4960938195595112, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31236998438712926, "ground_truth": 0}, {"key": "703d248cce913a6036347aabd2ba011a7f660bf4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.188323970638606, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3225259852697281, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.07751766116322842, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16667539944177548, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21469139933979542, "ground_truth": 0}, {"key": "517b86691dda04f41123354c1b7a7bfe1290eadc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23370636025768038, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35220175980487217, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2568319940055773, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34334170988452084, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798284929762581, "ground_truth": 0}, {"key": "7b361feeebfb078b80831d40d2ad8640c361e049", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3007455744901816, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.237929884058667, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21866937663140684, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12002563209107886, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30902368968751276, "ground_truth": 0}, {"key": "7d8e196095e4561ee4f01c650101f5591fce4a8d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14128141499517896, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24220560666397845, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.09807931628496279, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11516223271032065, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610488487357668, "ground_truth": 0}, {"key": "ae03390949407f55c8d8f794896af3020d180b12", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2043418906017188, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3960681605025308, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10158944033243457, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.36296923177452706, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047868712411956, "ground_truth": 0}, {"key": "4160464d3fcba547cb1664e54ce51ad06f78b773", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.307358015892911, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37387584227242043, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.603931818570556, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5583270093743212, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.537041381456328, "ground_truth": 0}, {"key": "72b396634cc46f29b5ef146a61073ee7e7fa3cdc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.812867312862539, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7074047136506041, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5312094082108384, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.851952793802963, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8244619250963118, "ground_truth": 0}, {"key": "b9b09b290cdf4d74cb64684a6cae8b6832645607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6976089178460114, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2213506998461637, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43974734731574777, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21469141860693974, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758280316087, "ground_truth": 0}, {"key": "9e49d58fa5ab7f3e4356cb61337605ac007c49ca", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2254166099472881, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8816148916699329, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33285234353475884, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3468730870304942, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.61508787697938, "ground_truth": 0}, {"key": "47fe0e2bba8206014fb53a7d5247efd1e316e087", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38676343402608787, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23792989475562246, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4980468664297183, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22270013989646456, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40544871391326487, "ground_truth": 0}, {"key": "f54f84affaebd1d86011ad31adbf9fac4754a8f2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2613309336121608, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3040416751148808, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2893716682415908, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48438008800919513, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3415825054280064, "ground_truth": 0}, {"key": "bc4992871e25e6584936af456ad4b819dcc52f27", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421497942144903, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5234203579152077, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6706082960865816, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5331543977409, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5621764992291274, "ground_truth": 0}, {"key": "271416bf0f15c52a4417339de78dcecf378b3950", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082866422723, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44939263682746905, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44746031365447236, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2658804794846095, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651621864149694, "ground_truth": 0}, {"key": "0add6b43e18072837f0bef41031d6f92f740d625", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367540558056, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4513265128739381, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2942149718023331, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3106943659501976, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689406914341987, "ground_truth": 0}, {"key": "7060e3feb685bda7b5102e1cc8e9b35da37ca2a1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33982762211160583, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2798284702240061, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35756752107285145, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17441026089908818, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713686044426073, "ground_truth": 0}, {"key": "04fbd3088e8610dd4d5bea709e7cc5ee3e53710d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.136608393305485, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.51757088122097, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.684264022914841, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45132653636698433, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213469898994, "ground_truth": 0}, {"key": "b198f0356c0f0cb09aba4d7d5541dd7c5ce91678", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38861805762728907, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2942149736491421, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8976952879257284, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4320633834875834, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786133178635, "ground_truth": 0}, {"key": "0f60442453e038c6bbe3aa525bedf2a97f459e04", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808577764166, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21733751523427022, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29259529180547755, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37204881494386866, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.305697329883383, "ground_truth": 0}, {"key": "79b423b90af6b3381ebfa34a7382ca472bdb5b35", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25683199607404344, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23370637388879906, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22405543283484106, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29583987817079116, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14608724701001471, "ground_truth": 0}, {"key": "3e5a3a2dddee7ebebe57c12d0ace97a24cbabd72", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16026603622605756, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27357439785789417, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20307463700172937, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4436004151046205, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357959064721963, "ground_truth": 0}, {"key": "c623e4914c04811d354fa137e3bf7a00980ef7d7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26435835161652244, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21601154730305455, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5156199140085758, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24220565457407273, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18952109047400692, "ground_truth": 0}, {"key": "d5ef1fb6f2df20e46fb032b9e318bc8555283e78", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3276683167583523, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.06608537458631081, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10594828972376011, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11279540152239283, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18010667316274576, "ground_truth": 0}, {"key": "e1a36c50adadc5db9ffe6fd2c5e275d522902193", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328821383056048, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47852882666974966, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4359015107318489, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5467381397291259, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3611647451442394, "ground_truth": 0}, {"key": "bad69c9a3c7d84a4717705a3063dd7367243772b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052534563387, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18594719656947276, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.08269734060402147, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18010665650052116, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765261670468825, "ground_truth": 0}, {"key": "4b40ad1f0e59b139e9a1466859ee08a048ca8d2c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2018132129246599, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5621764899534933, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42441198046875805, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3363310581666909, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4339814792170742, "ground_truth": 0}, {"key": "c17a30b4c0f8f58e3afa6279a39470f65a179f6b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364242128832828, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5602526694139234, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6992544104012044, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.794384953393159, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416740051796615, "ground_truth": 0}, {"key": "6f579aad2d1f601b17e01057cd4b5e4942627230", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331444556479, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7122321821047737, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6671476835817202, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4571367265833999, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5253688120916966, "ground_truth": 0}, {"key": "7551f8e13485bb1738c16eccad343a14a47b2903", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786254960296, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4054487447522703, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22270012729555394, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38306416340120686, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42250460819749547, "ground_truth": 0}, {"key": "257d8d38863175ec9401d0532963fb71a47f0734", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27512973427440324, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11436852206792268, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1066905847089038, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16776334030802872, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559408988523844, "ground_truth": 0}, {"key": "aa596e10dfe78dd875a7e15bfd53138bc8bde471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.09268778727669427, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20055767202256017, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4359015402289115, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8539127552673832, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20946967429190233, "ground_truth": 0}, {"key": "a0dff972172125f32b79977a47b0d250be8f71e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3345894380375143, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4186969006202529, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40168780958502415, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28140562106025013, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073333884119487, "ground_truth": 0}, {"key": "faac3a6337907b1552b7068c8701cae665c4885c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473501793107, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5448014158603623, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3007455619268277, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2643583651738859, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4590761156753181, "ground_truth": 0}, {"key": "c741b211364d761605050776064a506d24378d10", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1847675144190865, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5175708724269986, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29259529594189054, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33633104607265785, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2942149682372804, "ground_truth": 0}, {"key": "a062b8ba08369be2364a863020a28de63a3cbf86", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5602526371020665, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9005297880718229, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8376199669549872, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9429286018975628, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9167080865567308, "ground_truth": 0}, {"key": "f11102404d23702fe398b1d690d13418703e617a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8449215367137101, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3998116398958614, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45713671975191283, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5888891398758285, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33285235148610265, "ground_truth": 0}, {"key": "62481fda7e7b9714b994617909349550707fe8a7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4804786852400688, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5525397269462574, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8824278618180653, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7122321792244332, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7577943761039876, "ground_truth": 0}, {"key": "13943ef2d9c3b737c9a900f0cdb32a9c39121e6f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.709019142801782, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8539127609742935, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7879311932559049, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7759445460250327, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8824278596437349, "ground_truth": 0}, {"key": "0c25e0cd62589fde1b378606febbcc5a2bafc770", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7476159464325776, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44939264778297505, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6001883773680091, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4130035943969311, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6513548754787469, "ground_truth": 0}, {"key": "a86bc16fad35d84e988af4cc64bf14877337d47e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4824291045480319, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5117165875497928, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40356682856308296, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40168782374997775, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406746230428, "ground_truth": 0}, {"key": "0f937bcc8cd07bab2d5aa9a4492d3c2430063b67", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25683199948578983, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38491215399456463, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.679178722207617, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3486451212788945, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6095241668340945, "ground_truth": 0}, {"key": "a6c0617d92807f05f02d767261c45b616382e499", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4668456128427084, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09807932643572186, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43974733522801757, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.236516237898868, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20689404070005663, "ground_truth": 0}, {"key": "4f45a0576d353fa9b5b9d1c8e3cc0e6a1cd4897b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.586996436050159, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35756750045255475, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4339814984967969, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3007455762263385, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668455980710346, "ground_truth": 0}, {"key": "f6d43a207c2b3c48e787087b345c23d2fb1dc92f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.644225105647755, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3522017985198074, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4707366276241363, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4726835018652525, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253873159685, "ground_truth": 0}, {"key": "e0127487aee3a00fe164d72eb697221079518471", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108584479187, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20946967398057223, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31405055943867227, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12678516531634537, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3123700182081158, "ground_truth": 0}, {"key": "2f3af8decce1c0a6cd22b21df96acd40b14bb62b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2030746416977451, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37754064726775355, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6976089170553491, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5583269908101963, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "13a366f303e6ea2f07c353a9f5fb49a44840f808", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8397339577746541, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3486451428555418, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30735802313352223, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.204341892985413, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7041601645236866, "ground_truth": 0}, {"key": "ee36a8b5db09b9e9a6d462116539ffc095d5c017", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358375253795, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5389831846783167, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3757064906366991, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5253688186509475, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5078118826787948, "ground_truth": 0}, {"key": "d3b3bcf90226a694361cb27f1a4d481c79b7368a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4455295523830572, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2643583417321406, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22953520021879867, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2227001383151916, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541661393249413, "ground_truth": 0}, {"key": "e5e837f2cc75fc44ebf826822aa4c9dc59344b8b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808653738026, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4167966485841138, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3923368543194815, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2845760067904176, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22541660851738193, "ground_truth": 0}, {"key": "1317a869cc1d6d534a93eaad67fb6550aa155ae6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34510528255426914, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7813306302057292, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.715423979506038, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8056321833411484, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5813030942682617, "ground_truth": 0}, {"key": "f856ca4cd15992e0e88ae9113bf31b2a5ab55072", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48438009435787827, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44360039648910504, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36658974986349, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5214711394031027, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4960938275776476, "ground_truth": 0}, {"key": "438e8eaa1c64cb59288f9954355d0100181d19a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284180911800353, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3451052599664374, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29421495853912427, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5660185499891082, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.46490156549842776, "ground_truth": 0}, {"key": "470618f9fd48a5d134a44b5de166b625f596a0b3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5525397062708408, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2509127842202893, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25091277648266697, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18476749870558973, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37937838049371947, "ground_truth": 0}, {"key": "751e8f720d24c57e79cf63d9a3f72cd80c5d9619", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27512972437313554, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12252321135809446, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.12678517743532178, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07864237809363446, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792989000650686, "ground_truth": 0}, {"key": "6a985a1090f146976d33c8b33342320a65a50211", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23091976251516172, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19193279116526982, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1441488534287986, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45519857093133115, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22678363679914276, "ground_truth": 0}, {"key": "4640d2f968f31bcf384d8253e055611b10f4a38b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16451646333319395, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36658972891166525, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3867634297180532, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25832598754979325, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076631419295846, "ground_truth": 0}, {"key": "22e0c9ba3465840583a5fd79714d2f7663c7e3a1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2974699344192546, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1285251303360016, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14903529249781414, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21733750372543176, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1613202345899757, "ground_truth": 0}, {"key": "10dafcc21761c60f8fc5bd832daf8f21cf0fc66d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541660981500264, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5175708752924736, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5602526447653476, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.44746031157977734, "ground_truth": 0}, {"key": "75da85a72e0028e1b07c65f6b771a1eaa20b4e04", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5156199133434493, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2186693765343125, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1571368667333618, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41489883171950803, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4035668281816099, "ground_truth": 0}, {"key": "9166b4c77e919f7a7cc457f9df981512dea3694f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3380771098790447, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8902942329773698, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5698526530703543, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7041601422747711, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6774740422378112, "ground_truth": 0}, {"key": "81e50c6cdbea4e55af6307d653135ef395b6d7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321924041036, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8128673244150193, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7981867834312034, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8289388238453321, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297745959879836, "ground_truth": 0}, {"key": "59fa6c3439d216272cc845d35627f8eb11b08a6d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253791324494, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24653334313923894, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7325918390463181, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34864514382530454, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5214711631556234, "ground_truth": 0}, {"key": "2eff3ba44cfaefbff89ebc764828ae9e4d477c9b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4513264979225981, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47073661098783626, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3720487774698113, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44552955491361007, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365536907053, "ground_truth": 0}, {"key": "74698ee383888faf5a49b32ecb8211b888270b76", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3757064579501441, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3157359950408122, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4016878256096337, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42441195317506214, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36840568066098756, "ground_truth": 0}, {"key": "79a6d24f452d8c1cef47ab224fd2083b0d08324c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.726425612934457, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.275129706722897, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22541662522287487, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2735743906094691, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16559310693153287, "ground_truth": 0}, {"key": "50f2041a2bed7f316d3254192c4158095eeec2e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23231015355440385, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3504213758528811, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20817891479149, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3106943668575377, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405544224755022, "ground_truth": 0}, {"key": "de6ed8db6d639706f2c5015c699fc578e4aa43ec", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684559173565565, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4571366990915237, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2598256223643993, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49218814924253246, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4378234633371771, "ground_truth": 0}, {"key": "8abb66a9697a8c59348fcc79de126691e394bded", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6406358640746586, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5486734724534333, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6001883752017333, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4941408781274577, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5039061771917009, "ground_truth": 0}, {"key": "11ec3be451b57e4312b44eeabb3ae441435c662e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7041601360621833, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5175708876559437, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5869964305294921, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7074047034818609, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786174283256, "ground_truth": 0}, {"key": "eed527dece78deffed54a7cdd8516c4d57a90011", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8056321986263281, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.36840567606520425, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5389832410912008, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3451052749284009, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36477755725120536, "ground_truth": 0}, {"key": "803c0dc8b3d2eb528fd084b613dfc29d98151d72", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641812715971, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2861692413798983, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3775406682319546, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.256832012747691, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133093200373664, "ground_truth": 0}, {"key": "d4fb4cca753c0f5586bd93bb124b0491711396d9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561503779859466, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3923368395787016, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.34864515775044086, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3757064497410327, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36658972128755907, "ground_truth": 0}, {"key": "723443b1c16e2276a1aa03259a600044e86c2538", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3812195777463108, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21076632032992393, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18713269288016707, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31573598002132064, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09602548619011346, "ground_truth": 0}, {"key": "b30a8f4dbb4f8375a8a9c2ccb4f658cc66dca0f5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31912136768100774, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25091278292154173, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5794004125929126, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15817436019229034, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4359015376149972, "ground_truth": 0}, {"key": "f874dc1da36d2c45a65f78dc0dc9dcdf5846c3c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6039318042582742, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18242552519208163, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3960681665748212, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.36477752743355446, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531316743934, "ground_truth": 0}, {"key": "60fc2801c429858cc0a87e547f1c30e34a7a96f3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468850285969, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22000710718454353, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3998116212207366, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4054487663546549, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24653333972567706, "ground_truth": 0}, {"key": "d885b755dab03a11c7e3b19455b82859a6e1f76b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28140559310025376, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.364777558614664, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2254166140856445, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26133092259975527, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25832599134565093, "ground_truth": 0}, {"key": "9ce486aae2ad61c78b2e44d2617276a470c9f600", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796380694386, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6001883874143343, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33458944148125513, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2974699152013062, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6279512232591573, "ground_truth": 0}, {"key": "162e54974cad1d0e067a97e37175951c26f13a0e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7401743803787375, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6388352851880258, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4111108457709738, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38121957054026184, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5544704651885761, "ground_truth": 0}, {"key": "03a0cef9c902928979ef731616fb96bd1fb10f9f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44746029439856594, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31405053667934735, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3157359764873022, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4320633939221324, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733750748947914, "ground_truth": 0}, {"key": "6f64897fc65e1ba7531a4830a7d935ab15d8bec6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946969192546333, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2766905386630296, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35756752738092606, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2720245523779168, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059959306935957, "ground_truth": 0}, {"key": "0d7383a44955b41c5a472151a35a842751f0004c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3398276267972054, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4301473276565802, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20181322028390564, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37570648774769133, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165295210384, "ground_truth": 0}, {"key": "2fddefe691f7849048548a15f6533339d4a25bfd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242553425778085, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2450850134866674, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18713269288016707, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2720245695543264, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193279955409692, "ground_truth": 0}, {"key": "e35ec8afe496d466d673ac67d80ec5c21b163410", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711592781637, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25091275583239014, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14318770036016165, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3276683021054899, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34687307840341863, "ground_truth": 0}, {"key": "b4aa207f0723ae8a731dbc07ecdb03a68a42031f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944725577569443, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09467771415232262, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47268345041703924, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.10669060094364034, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5563995918819593, "ground_truth": 0}, {"key": "a65ecd71682863f7b12ca11ab8ac23b39ae302c4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14223188203655462, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10594829035055234, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17106117968474951, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23934935112152286, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22270015201238727, "ground_truth": 0}, {"key": "215a2a64c7bd36360f76ec5e159690de07d7d959", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814055825531725, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3486451292081193, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6531269096116301, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5448013911699233, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.692642006068383, "ground_truth": 0}, {"key": "39074eb06df4966d1e06f76ad2f0713b31335fe5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48438008478136535, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20817893473732405, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.31912138656280686, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13939638410850974, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193278653820237, "ground_truth": 0}, {"key": "3cae0d9bcf97b5d182b20a31aaea3f41cd7bf599", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804791161448, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.799442322068178, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8397339538055357, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8255897123226144, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6859494661669706, "ground_truth": 0}, {"key": "6a9ead70f9423e494c466189bc6d907071547f42", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6654105633362645, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3345894449133369, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2766905320386755, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12506538298306324, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26894139933540123, "ground_truth": 0}, {"key": "9a15663058028878027f6aa039fb3185c2ff52c8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102547744376, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4687906446348592, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.594551254789276, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43206338747465994, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4980469277581446, "ground_truth": 0}, {"key": "83cb0c7e79d4c71703e1bd5fc346fe68be8b8b13", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808715115661, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3468730950192094, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5039061924319846, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.370225407973461, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4902356247113809, "ground_truth": 0}, {"key": "5eb63517219a5d2aeebd21aa66d9b69c52cfb208", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5019531361320007, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1520322372880679, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18832398142797246, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1943678117626668, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15405755069880978, "ground_truth": 0}, {"key": "4a1de02b50578df33ea7b0cb384bdd6aaf4ee119", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2068940534139215, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4225046011615868, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6566582896467084, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22953521698320073, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.327668300649582, "ground_truth": 0}, {"key": "ddedfc2a349fb607ed7efeda1660e9807454ddb7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.535098422794684, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21733753812768475, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3793783781676312, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2958398451023165, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.38121954573707906, "ground_truth": 0}, {"key": "1cce8238a161fda411022c350d2b9a49072f366f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30902373424842394, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.409220796155449, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47657964139076814, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2877678028798378, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3242354067082848, "ground_truth": 0}, {"key": "0612042c0c7d5cf6459f5435402919673c8c552f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3468730937480154, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19930800534266258, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48828338505510227, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39047582322162094, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570645336013403, "ground_truth": 0}, {"key": "cbe1f7ee7f5d619093684cc123e3908e39d79c92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6808786348037816, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16026602897179246, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6001883584227264, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3191214062965253, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6876299858605013, "ground_truth": 0}, {"key": "42be47d5986a9a55b413eb57359d2d8c51b59024", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561504344257509, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37937840359865155, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.482429147218858, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27048020163757275, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49414089764837615, "ground_truth": 0}, {"key": "9f997964709283520a65d2ce75de7c8b154ce351", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.411110882278316, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6169358303458865, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3208212822372766, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6513548505777971, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6636689491226576, "ground_truth": 0}, {"key": "57da930302d81b46438b0f715a5218b7174a5611", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.638835257416944, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3123699994418036, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16995622220488923, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4882833960159579, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357958984953513, "ground_truth": 0}, {"key": "bc639974d283826b3b928bf90f0951652db71fd4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19559407976474413, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6057990310972383, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23231015228839313, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.37754070502879955, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.405448758226489, "ground_truth": 0}, {"key": "304002bc095b57d14b728ccfb8d704ef39f28813", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1581743640896503, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10743747225272761, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5660184972969621, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.09009299252778864, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09334687435835567, "ground_truth": 0}, {"key": "fab941df6ecc8251b49d28715504baf4ac31dcf9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27825679159571765, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39981163700753936, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3504213899719455, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39047586134081047, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37022538761398455, "ground_truth": 0}, {"key": "92dec9732f4244771770150d82cd6086f40e5621", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46295861087911155, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17553808111927316, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24220562809209373, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13477592045444334, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.131173225184135, "ground_truth": 0}, {"key": "d2ed554726c632af6e2130a580964a261f8c2e60", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21337715333301127, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6842640131932962, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3738758195273627, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5602526623107914, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6057990558724641, "ground_truth": 0}, {"key": "84ab5256295369509813877f5000bb7e01e7f641", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6224593109077009, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35042137857925176, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6566582607004531, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6334102567407063, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5058591134352542, "ground_truth": 0}, {"key": "0e3f2fa30b711144fd8e49dedd6c248542a9083c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224417145061, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.590779184896303, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3904758744518346, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.531209374842465, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199178189753, "ground_truth": 0}, {"key": "67ab697c3e2d707e3b7d070199b065b1541c8925", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4130035716739997, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21076630158859558, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11838510582089594, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26284184083291307, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2081789294078026, "ground_truth": 0}, {"key": "71537a701b69838dcb68ae310c7b3bfb375c1344", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23231011566367019, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2861692434685, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4167966364661414, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20689405184076115, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.45519861403098016, "ground_truth": 0}, {"key": "83989da5142972bb45c7f1e25ea60c6b101a9987", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398627971890434, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.346873076092112, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11596071567776407, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4148988229670789, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1919327619509154, "ground_truth": 0}, {"key": "cc432e8a26891d7fcb62b112f868e994532a7ba7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864513479105447, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20817893223932574, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20181322710793098, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14804719464706925, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2925952934717966, "ground_truth": 0}, {"key": "ef024e4ca04bd445d2915e7fe5c2c3c9b6f723a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26435834705613204, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3140505366747359, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.373875819227248, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38121955579048983, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2643583621046277, "ground_truth": 0}, {"key": "dfc606b97c43ac249d72cff2fe812213987a37a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30074557364658927, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.220007101983302, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2479874113607972, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23091975124165706, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510839189775476, "ground_truth": 0}, {"key": "087ac92e2ca469b5ca6277950e63b2f0706d0de2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11357959694713272, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17441027653340774, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.379378386095685, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6740505005061783, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111088744183266, "ground_truth": 0}, {"key": "a1abb9ce1c76a6c390233d8ec934cfb34bc35215", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220564754936982, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3486451442148947, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2240554275769217, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15713685551855788, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2146914267747622, "ground_truth": 0}, {"key": "99ec57979392a7f9c1a24158d5e1262cdf113f45", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4244120048256912, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11920292612819075, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16776334422765576, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2798284723412757, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13386748491801448, "ground_truth": 0}, {"key": "ca5c0c816376354b82a4a7b9fa9a31b655e2d2cd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1789558909857545, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3998116410256193, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6020616223012684, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5273165197995798, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24077459528568126, "ground_truth": 0}, {"key": "e9787bf9462b12b7dfc0b562510a551e7d07b4d7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4263215970986384, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1540575495690627, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2861692224983988, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25238402475795635, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404169024510597, "ground_truth": 0}, {"key": "ed8a7d5b06b4b5415725e624a15ab5ada7146894", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2766905162982082, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30902371687004865, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19193277967663877, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12592275797940639, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13028541608260857, "ground_truth": 0}, {"key": "4b6f2532f6bb4cf4ae341e4fb72d384ef58f0f42", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.072112209722326, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32252599042327607, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2628418364660738, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21469140848349058, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2942149917366054, "ground_truth": 0}, {"key": "46102a68e2927f930c1c2bd117ca714d188cd1ab", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16344545682894057, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16026603260501862, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21866937663140684, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17781087146479413, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12085322950122666, "ground_truth": 0}, {"key": "ee6568a8880e61a498aab80c41f70939d567c991", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14128141499517896, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3665897481669505, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.327668304965425, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39420096440442565, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43782350602215975, "ground_truth": 0}, {"key": "8f462be265750ebbf85a6ad8ef28cb39c59f826e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32594951716851966, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3433417361610964, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28776780497731447, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34510526346307463, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13939636732217545, "ground_truth": 0}, {"key": "b21258342db561f79656c3c75f2e8c8244dd6178", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.304041683000381, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3904758217612684, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33982764302878415, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35220178126514906, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116474001322313, "ground_truth": 0}, {"key": "c7b97c7c2ca7b9bedff4978dd3cae9aaef8f8100", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073744349428, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2658804787229489, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1907240174654954, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33111973004794243, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25832599470493023, "ground_truth": 0}, {"key": "bdbeb9265050f2a4ce200c3802775694b7dc20e6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304214005766759, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5195213113334078, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.34334171224124377, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2005576917246483, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4301473361499011, "ground_truth": 0}, {"key": "42e93d5aef7547b8169f1f6c7735d0265a030580", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4016878001882368, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43398147164047773, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6297746196303828, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5136684715961838, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30404166946867034, "ground_truth": 0}, {"key": "6e7a607934780f0011aa4e84509314efe15c2685", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708801585406, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23091976495274277, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18832398670921102, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23231013285219934, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20307464385462298, "ground_truth": 0}, {"key": "c087e2af172aed145b177c9a1a68029205bc732a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667158826244653, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5019531145741403, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6566582811083457, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26435836014410713, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42823340893327466, "ground_truth": 0}, {"key": "40e79de5b7a27d7161b147725936d1d47e45c8f9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3702254065350592, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22000711761056604, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43398146326333065, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1581743318974109, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.44167301982184415, "ground_truth": 0}, {"key": "e878909ace599352d3d578796968bbd52cb299bd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3174262643255993, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3208212904459468, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6442250755447075, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28298811755460435, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495210928376, "ground_truth": 0}, {"key": "470708aab0fe600a27423bf4a2f8c9860fe5f64b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618432302629, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24364244133344726, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3998116419218402, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2227001412352336, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1755380924582305, "ground_truth": 0}, {"key": "16e8cb520c874af6825d4661f6127a67efd4b6f6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3090237108356437, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11516223710035142, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.0900930000099761, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12002563172036423, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13296424316511615, "ground_truth": 0}, {"key": "38673348ff28676905791fe3e8db2bbda814d974", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10594827524541386, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.205615048617312, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3647775560250268, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.36477755827880054, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1699562241381783, "ground_truth": 0}, {"key": "914a0163e25ecccb635b601837cc4dd552c66ce0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421499241955656, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4590761309177329, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3557748739255283, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5448013730871352, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3904758463952621, "ground_truth": 0}, {"key": "851c7314af56b6f47742970e11696948323dfe94", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117165762028556, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31236998572625035, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2877678008537505, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29746996103171774, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13028541970355484, "ground_truth": 0}, {"key": "f29f04e8f0615b768dd756c4387e87e27b7b4c2d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.07211221130243761, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7138307761181119, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8354835184777871, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.647798211759194, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.618780416962941, "ground_truth": 0}, {"key": "8451164e86012e6dbf2fd39f7e6ca784ff9f3624", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056357893955, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6688802429415329, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4551986199430497, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6893056371578887, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7505527549050963, "ground_truth": 0}, {"key": "18765fda59852b1c13eb226a2da9ab0979739f44", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974735067525733, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6566582533069834, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6370307850503376, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3157359579534518, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117165971607984, "ground_truth": 0}, {"key": "fba410776268aaf447802e66ac94e4af54f7cb7a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.40544873418860383, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7090191432098992, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8459424415070682, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7371581630523092, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264255857572383, "ground_truth": 0}, {"key": "31494e5d6eda2042c4793ae68cea4b8304dfa0ad", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9046505267630023, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28776784620886714, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5019531065431526, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6688802888927057, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2365162465073549, "ground_truth": 0}, {"key": "564bdb9bbcd2276bdfbdce6eb1e2058f0921bd82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49218813875984035, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6859494532488153, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3328523207127367, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6548947344617692, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117165935958744, "ground_truth": 0}, {"key": "acbacec078274c02aeae06061357d02d950fec33", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358180478117, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27825679482163684, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24364243860735754, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3468730757663288, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25091277333829515, "ground_truth": 0}, {"key": "04327bc3e426eee01ed61d369fd52415aa300ddc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24798742682964064, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3575675176885401, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1250653838566598, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.05146276683461777, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516222713116639, "ground_truth": 0}, {"key": "b1f3d2adb48370e5ecadff8e6e3baff407b01f0e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.07316472418394754, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4649015811561338, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4960938557739412, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9155072482897031, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5506073653281804, "ground_truth": 0}, {"key": "d7eaf2e5ca91bf54c05ead867e5e90728d44e218", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4111108522303886, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5907791930813487, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30569730874913315, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4436004343112596, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5717666109217594, "ground_truth": 0}, {"key": "1fcce9f667de2a14d76aaa6cdb3f1e6f7900e463", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315316738792, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6406358524431173, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7648915977800661, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6113819712102617, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7248702627774046, "ground_truth": 0}, {"key": "892f75a4d31560b60aa588faa6f4bf51322b8c18", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7431679931171558, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5234203348311026, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3504213899719455, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34864512706505496, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25091280461289134, "ground_truth": 0}, {"key": "acf12bd8d1142648b1b522a3a925e14e48b8f068", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233683241227485, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7233094522970462, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8128673230827715, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1480472143534909, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2568319999817755, "ground_truth": 0}, {"key": "c8caeb08b05cc56e1ac29146793ceb07e4c0de69", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5350984478944962, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2465333586426196, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44552954147436136, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4092207934722474, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256080426602, "ground_truth": 0}, {"key": "ed7ed4440f5f7082230ae745d240350a4f20b8b7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678362082897238, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19193278876533376, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4111108981784677, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19072401892370766, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133091495987265, "ground_truth": 0}, {"key": "25b7adf8bfe43c2953a874b18c7766370158638a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6442251235650817, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7476159526212568, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6584175097000688, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5117166014330301, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6740504715294852, "ground_truth": 0}, {"key": "771c125e3b0c54f1c3367b2857f15d689f081163", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7969253664965734, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34158251482317264, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5058591202380266, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34687308152370033, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5097643619319342, "ground_truth": 0}, {"key": "4ad70f84c363e5b594da00983e2b40600f12ca54", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.525368818795455, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32594950934858463, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49609383658033723, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4378235196312089, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5926665926055997, "ground_truth": 0}, {"key": "cbb5654e979eb27e0af71068cd4e4e5191df35ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36116467479316416, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12592276362647567, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43014735136205573, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3720487661089007, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2309197669092101, "ground_truth": 0}, {"key": "bde6b7e505c05a15a9afe44739e7f016ce169735", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2146914296621321, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3775406618643791, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38676344605128155, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28140558681393846, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798284986759893, "ground_truth": 0}, {"key": "abc4744227c6bf0ddbf64cac2269bd4c6d02938b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16667540998037744, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3867634556744799, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4941409007975566, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.336331045733649, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2958398472707169, "ground_truth": 0}, {"key": "f7e5e75031e9f099564ed046bd822ef1bedb3188", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4073334191587529, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4687906478603567, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.09467769819765233, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47657964498411426, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16559311835015453, "ground_truth": 0}, {"key": "9a8ee7eb582f293c617eecab5f37374d9400bb04", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3486451161289127, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10017220962545595, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24508501357438975, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.08151975695014835, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124120699486964, "ground_truth": 0}, {"key": "a745e5a95be983cde00f3d472062c0627db3113c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1441488505381855, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39047587463496425, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2909808678455084, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3793783834248096, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22000708772014121, "ground_truth": 0}, {"key": "698cdb1268d4da1240d7f540bd4a5af4e229d00f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666017230089, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.13939637762881862, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.302391099214824, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4610167807243602, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1451153825294949, "ground_truth": 0}, {"key": "708c903fbf6a7c3c84f84ff34496eb0cb51f44e4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39420096211826766, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5602526851314558, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2643583599865586, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42823340741598764, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13386748550045596, "ground_truth": 0}, {"key": "26a1bafbde5cc970d5aee024dc8ef418587018a9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366137129045, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11757214588034823, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3363310376728476, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13386747571020188, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1847674995467497, "ground_truth": 0}, {"key": "6832312991fe5d87d0e300374ec7a699a921f06a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679366090992263, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29746992625315016, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24653333312109432, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7233094684165794, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3702253973088031, "ground_truth": 0}, {"key": "9c5d5d672c2549a594b801897a27dde1492e11d5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6424324676436938, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35220176191498215, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2005576755558251, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29746993331025723, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3757064827619046, "ground_truth": 0}, {"key": "c32fa9084fe8cd565890a940794e505d5f7ba4c2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15304217112589855, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5292633695971322, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7170118974194998, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44552953935126044, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39606815858264033, "ground_truth": 0}, {"key": "41b5dd6064864c16fbde9b46d37c9f7d9a56e705", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4980468872333961, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7325918260026107, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.426321612020739, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6388352984550154, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5888891051590533, "ground_truth": 0}, {"key": "b2d3ba739af767da7aa25c3ba8e1d186168c3394", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7931059446662565, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35398628119601766, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5525396777904202, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25683198440800414, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13660837400997403, "ground_truth": 0}, {"key": "519fd9b5c5ca82979cdfee3c990c3590838d93c7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013873679066, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5058590895210916, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38306415084295203, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3886180194473977, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.46684562492098336, "ground_truth": 0}, {"key": "60f518dff20b2936b104035b1fd9584dd7d16def", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3702254142225491, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4263215767784708, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6388352805706798, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5273165299137565, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33285231698879236, "ground_truth": 0}, {"key": "b82546b760716f0a2b26606b07af0fe0dd61d6ff", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5253688300005283, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11357958851946962, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10669059479693904, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16885695939289433, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09670579419234371, "ground_truth": 0}, {"key": "7990fde4a924299fab79f6c8e2b447ee5ffcd1fc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18832397231034512, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9849273709736622, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9645892676856694, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9039745150418587, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.991554373516022, "ground_truth": 0}, {"key": "504f6f6e1aea6bb73c728d12a1342faa6828aace", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9284087994303657, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9790357566095275, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9742394392434962, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9500414814386612, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9449947128837363, "ground_truth": 0}, {"key": "ef42653bf9337de184e74be0160b807a41b526fd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.961533808925469, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5698526737514363, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4130035590732593, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29098085523579265, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23651621773828457, "ground_truth": 0}, {"key": "26d0a5624f3ee7605833c641da5d88e2259b1162", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30239107704097673, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16451647257173824, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4668455879797982, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28616926076780796, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16995623760894432, "ground_truth": 0}, {"key": "7e43e9a2c67829721ff9f68147285c579e2c8a70", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42441196861808056, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25683196130395985, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19806417080851732, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.042403826681430765, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.041462271685122544, "ground_truth": 0}, {"key": "2137ee3e39b5c0d12e17bbd1e10eb75495a3a83b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15203223341513047, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47268345787717597, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5755879995893873, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.433981465323889, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4130035871098559, "ground_truth": 0}, {"key": "31defcc44013caae59c0bdbcedd16be150413bd5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2782567681693621, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.550607360929755, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.672331690655616, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5058590967824705, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7138307523129656, "ground_truth": 0}, {"key": "db73dc3466e4e92672d716c1eb2ac9430ac69951", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3867634229043719, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21076629963986204, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22815650677877725, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3486451545409547, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3738758353710271, "ground_truth": 0}, {"key": "3f6308f2f5b6ccdb89d7b6abe1b9490cc30b8e5f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18010666287240962, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14318771369592861, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.08756383896860313, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.06954173929991318, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1320661606254353, "ground_truth": 0}, {"key": "068d37f7a1ee822245dbf9d0d8ddfc281919d7ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20689403192978137, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.459076124142805, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3539862920794319, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3345894502593545, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.195594081292964, "ground_truth": 0}, {"key": "bb1e2c23f3fc6edb0ee4bed365cb5567c87a5aa9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4610168020192303, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9289263228551675, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9462003555180967, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8840392944511598, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9629528327635711, "ground_truth": 0}, {"key": "7c72b57e65ddefc77362ed64f7dbc0aebb87ac81", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9111797079447765, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.07211220731517562, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.06512754712200079, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.07807816790275461, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.05108273432088966, "ground_truth": 0}, {"key": "37a335b36b8d2472825c4624e5449b995726b7a3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.05623634389107718, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18010665086365643, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5136684960665708, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12252322492307327, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3311197290558522, "ground_truth": 0}, {"key": "da894eb6e5cc104f90ac65e8a124bfcfbfc6578d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3923368349408841, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5660185194585341, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3998116396240062, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4746311808891469, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526487880577, "ground_truth": 0}, {"key": "b7697e424512e656efe5f2aca17bc33cfe0a2b20", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169357927917972, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7025300452553553, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7534666502252413, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6279512033637928, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508497333134177, "ground_truth": 0}, {"key": "2292d4348e59aafbe93f3040af23fdff448a6cac", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3775406547229702, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41300356343652567, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43590152864845233, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.466845610860623, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510838465559736, "ground_truth": 0}, {"key": "8ed7e0c5e15275537f2c1d5d945e95709d7dc6bf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5755880133898612, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2509127851028567, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3174262703891765, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26740815881788416, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21076629987391746, "ground_truth": 0}, {"key": "6b22be31a2cefb2fdd302b8ff788335f23f5dbad", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20946969183635705, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6076631896148696, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5039061673099144, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6370307788848824, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631839043766, "ground_truth": 0}, {"key": "686caba1039a286aca406e0bbac00aebb198fda5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984874804454, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2814056303492567, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29910518241850886, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4073333861633751, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256417317794, "ground_truth": 0}, {"key": "3c84e13d5941fdbe626183cdf1dca9b5df6c8f92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17553806688350743, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39047583438342376, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3629692162931616, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38306415929245075, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2674081922764969, "ground_truth": 0}, {"key": "7f5fd7614f32586747f65545bebba418c3679d12", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3867634732178707, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2240554442640255, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36116470093244774, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.08819003381389495, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553806450588513, "ground_truth": 0}, {"key": "186210bbc060c272ff9a2412ec2e711a3e4a5e6e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22953522677936186, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09602548015614357, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36116470093244774, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19314739158777128, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1431877139162341, "ground_truth": 0}, {"key": "03392835ea832d7940082c421a21778c70701ff0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.152032249970658, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4746311786428177, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3106943814631961, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14903529212106176, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27982847654994647, "ground_truth": 0}, {"key": "e2b96982b60cbd10b39c1db4282023d0ac1f3f2a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364245051001981, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18952110287896118, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5039061495071119, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17441027335438297, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.13117322782210392, "ground_truth": 0}, {"key": "31310358d02c98abba71916e8cb4ef7477a2d82a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19806417530198897, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5888891462500077, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7534666502252413, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.36477753260216683, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43590151307802144, "ground_truth": 0}, {"key": "ec0e9a0c77bbb4bba73ef5177413c666e691850d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5409238930596486, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.45907615333066365, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.41111086110988054, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42441201022745995, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358570221041, "ground_truth": 0}, {"key": "02311be4aab97a81d2262963896b975c27f6503d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331369009329, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7505527587168981, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9559813522430846, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9606574920231962, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9403530519736133, "ground_truth": 0}, {"key": "a18b463219c663ef55a0cbbf81ae489cdf877b62", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7745833954323493, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.870597271618955, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6842640383532971, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7866228213281359, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6566582882021831, "ground_truth": 0}, {"key": "aa966ac9e3611ac2cef8d3fb9ceb3b58c150e238", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8128673215861241, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2422056442816614, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16451647238537256, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26284183604452743, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31912138221527664, "ground_truth": 0}, {"key": "5215d4e6e945ba390786f1720cc5a8abf92c32fd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4092208122071699, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09334687205044463, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.06512754712200079, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.05146276668810585, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.057493287661126366, "ground_truth": 0}, {"key": "e7297f59909379c8eb07ea9bc2377b5e3980073d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.05623634389107718, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5273165236554184, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6334102396011575, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7732163785718708, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49218814962830865, "ground_truth": 0}, {"key": "6c5f775006a225e617c1fa4cf0c439579e1443a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8558511533335298, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.299105176971185, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4263215919037627, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35936413318329224, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27669053812115213, "ground_truth": 0}, {"key": "46ce664a42eac4474d25c435a28790ec25137603", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5964331456106127, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5214711641553338, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7690802247683631, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6095241850130395, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6495786414198585, "ground_truth": 0}, {"key": "693d73ab049f7d8f3c897922b3f7269a96a1a4fa", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44167302629324356, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4359015286687545, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8587185873633604, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2704802158171495, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2351083859078013, "ground_truth": 0}, {"key": "48e4930e3c380330b609f460f11520be0e29d5fd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.38306414767735486, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6279512223371685, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4629586081446307, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2628418292814139, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5273165320697324, "ground_truth": 0}, {"key": "53f3e11ada213ff55b987692a2eb0c9b6d890d5e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26284182628064967, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6113819881836884, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.377540654987903, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42059959739071007, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5945512466610818, "ground_truth": 0}, {"key": "d2ee859acf7e35bea229f968d53240c2f1c2845c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3611647311266854, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31405054374062585, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4148988518419976, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23231014185281856, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32252598041556185, "ground_truth": 0}, {"key": "d4d44650eb77504fd01a730c0ccc7e6cdfcc578a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32939173886300893, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7371581800953996, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6943026761943213, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8289388148946376, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7676898424460527, "ground_truth": 0}, {"key": "3695132378151f89d210da575bfef0a3f29aa051", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5467381480961356, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2200071035954099, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28937169947671, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.26133091833741184, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713685881780762, "ground_truth": 0}, {"key": "c193cecd478fa204b16500ece25bf25b75bc5265", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.33633103716035073, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4765796594635098, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.637030791243226, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5660185340469717, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3504213926639692, "ground_truth": 0}, {"key": "b599d61b0c28b86dc92c7af4d40814ece8279500", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35220176665112707, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18126320660235576, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40168779648763525, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20561504421379037, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15203223669299223, "ground_truth": 0}, {"key": "06f290a163e81c46437ca61b5fd13741d7db11f2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1008786322273583, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2942149694171655, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46490159485550164, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5234203336456202, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2704801989397993, "ground_truth": 0}, {"key": "46210bd0b15cd5bba64751d873674766decb2677", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3380771296282857, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19806418046584934, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3242353876904887, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38306416234391916, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5350984762398248, "ground_truth": 0}, {"key": "cfba701dad16c47e0f7b97b8a6b043d25f740085", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220562445461086, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23651624019150191, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23651622277130455, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17781087069413143, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25683198667489654, "ground_truth": 0}, {"key": "1c0fbe7e6758334d83d145580688e7aa1c549c53", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3328523179744766, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8031737851665723, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43206340917645125, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7866228250888045, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102734549173, "ground_truth": 0}, {"key": "820c917dada8b32be365eaeec9edc1ca5833cfcd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832247606443, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3504213880961241, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5175708956102839, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6654105631150862, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315942661566585, "ground_truth": 0}, {"key": "faf3821150b0c63290cbbddd7a8b54900995ea5a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832236114341, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.445529543748174, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3593641422384992, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3923368151194255, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19930799280619563, "ground_truth": 0}, {"key": "1de0cae2832cf41f49e6fad8254247c789dfabd2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3886180073384743, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48438007300044444, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5888891231388778, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44552952844700167, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7310585779528482, "ground_truth": 0}, {"key": "6c6e51ef20def117ed9114ed8d8480b3a100f1c3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7826624988810257, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11596070599232959, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11201594531733321, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6334102482306176, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22000710607652163, "ground_truth": 0}, {"key": "b8c755b8921f7917d161605d2ef404d9551f3846", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22135069126005993, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9778834079018303, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9241418209290148, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4320634038360807, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8568123009427164, "ground_truth": 0}, {"key": "dc7e18d14b8ad29abbd79f554324ec7b8ba8b9c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586087292478, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37754069394227385, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4167966312374783, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3923368374222981, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2186693683665333, "ground_truth": 0}, {"key": "a7fc90db6c296663b1b7fc057451dfd45019342d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2814056208058913, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5136684598044153, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5736784024650646, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43590152888750083, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3328522948970435, "ground_truth": 0}, {"key": "7f22fbc4fd81e50c632c5853856965aa4d0065d4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783746006799, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2295352235184216, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1943678245456113, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43974737408556147, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17553806679585446, "ground_truth": 0}, {"key": "309ae632df7b88a9569d81fa91aff3b9fb03529e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.73411952279981, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33807714931917765, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6113819693789633, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25091276466065415, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40168779307683866, "ground_truth": 0}, {"key": "732304a0901ff14d023d4361c1d41a85724808f3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2991051850443931, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1980641751073096, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22953519247653897, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2782567902455854, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.17895590299899836, "ground_truth": 0}, {"key": "509b9f69b376e4acb8da49d53198699b1e779ea7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21206879750828675, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6297745989212268, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5813030786190452, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3998116623692391, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48047867595614324, "ground_truth": 0}, {"key": "c292860b41f7c9131458cdc44a79febef38ad8a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6893056164075438, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43974734943126, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2365162354463109, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.575588005932734, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4205995884431672, "ground_truth": 0}, {"key": "6db7e70883f0241081833487c421bab86fdac26e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5698526764149145, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4397473755427057, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2845759894335708, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5019531121480147, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633152975114247, "ground_truth": 0}, {"key": "e51e06234b3f49da16fec69aaee6fb9cd09cb1d8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4863315421743888, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.361164720452592, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8740772278415053, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.618780435853252, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782567959868677, "ground_truth": 0}, {"key": "42474528588bac3a27842671a3fa940fed450552", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32423541012421353, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5851011657482258, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6893056222980547, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40356685600408443, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631436300844, "ground_truth": 0}, {"key": "5932d9c8f1da55bad396197ebae0853c515180a5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4571367167840097, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3849121343425744, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2893717097057587, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4921881159448172, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.515619916925225, "ground_truth": 0}, {"key": "daacc676fc659bfd147d11b1409ab42615a2f169", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473253869415, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23510838910451828, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4882833892990174, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3849121593693281, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16776335084299016, "ground_truth": 0}, {"key": "7a02e707b139791920fb13115d6132541fff7d97", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5717666174172923, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4863315417501091, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6531269120369503, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40922079064562383, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4668455765485006, "ground_truth": 0}, {"key": "db1972f0204c7a9c292f4c85e8838251cb26625e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46684559774768697, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15713685606894723, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.775944553256842, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20689402809107754, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12336562055624647, "ground_truth": 0}, {"key": "6defcdfd6995661fd681dc15163d67f6a5d6727b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632808670355, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23231013884025528, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19682622223899907, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1233656233827866, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798284825870118, "ground_truth": 0}, {"key": "24716f5a39d23dafbe9a9df8fa002788d14d020b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586133679949, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.560252660764872, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.75346665696196, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4092207925068611, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6132365416831363, "ground_truth": 0}, {"key": "ab3c98cf7833b842898a568d872e45ceb2f7dda9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5640984610064905, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9458012693125692, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.959154284933591, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9462003541100308, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256046697558, "ground_truth": 0}, {"key": "831005755f85012c882f17c3b3699b34a7febb7b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568122937928339, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24220562663601483, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42632160967233773, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3225259934285736, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838511221274194, "ground_truth": 0}, {"key": "0590a8c653b7d332d9df195dcf3ce014abb4eff7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6057990568009016, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4532618577584353, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3998116670237535, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4843800884248813, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4726834941947069, "ground_truth": 0}, {"key": "f79341438eed40986c3219b67a3b5d87eb6c018a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4397473501612485, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.783988445186864, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.41489884055049603, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5660185224933102, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7201714883189528, "ground_truth": 0}, {"key": "8db6225f67580d64a196f2f3197386a6be950a09", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9621075723357447, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46295859358775476, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2658804869364084, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2213506675512113, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2479874212903435, "ground_truth": 0}, {"key": "e386d9ed70bac668fa6048b572f445d9b7b62f75", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13386748726436404, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3023910828144603, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35936415882952355, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35756754839132043, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015735598929, "ground_truth": 0}, {"key": "e35669d4530ea55bc8f0e451268cab9e9eaeab92", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132650482942765, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.11838509989573939, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5506073423453083, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1451153522933855, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124120985150161, "ground_truth": 0}, {"key": "d3ca193f45aef9aa766d52fbc58d6b8f1658ee60", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3293917015286047, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30074559282007035, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3942009347967045, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3040416601741917, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27202453943676336, "ground_truth": 0}, {"key": "1ca9bf09bf534add02b7cfe6ebae6d17cde66286", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6113819901448949, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48242914312730667, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4263215757497033, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3830641721056283, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33807710719563183, "ground_truth": 0}, {"key": "c296e88117bef515bd9b36ad560223df3fd2b84c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582850998358, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3702253638665447, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32766829922219526, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2958398581706646, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.258325978266458, "ground_truth": 0}, {"key": "c5e11ee4c2f0ae511bd0e1fae2978d070b1efc15", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.359364134797355, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09807932911402242, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.222700135184903, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33111974014023626, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11757213628016153, "ground_truth": 0}, {"key": "1fc2d1ecf1ffdc2f0b642b686e1c21de53a4fd28", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1835936137495303, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3380771179473157, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2465333632990369, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4649015665478685, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48633153412363017, "ground_truth": 0}, {"key": "6556c64821ece8123c130b27285efe9619c3c7fd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.48438009129191867, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15203224077114358, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14128141654207987, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28937169498364834, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573596913050495, "ground_truth": 0}, {"key": "32ba61f4513f7ec21cedb6ddd2a8a93260f8cd56", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18010666055936472, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.06465348917795267, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24508501357438975, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.017176708643924708, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838509986723034, "ground_truth": 0}, {"key": "1146cfc5981ce23511ac1bac5f3957c30bebc7b8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14608724257928704, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24364244272408214, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21469141039757186, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3259495015350333, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4610167652656119, "ground_truth": 0}, {"key": "e060abdb2a5e2ce6152ca0ed53703a9d17b2df36", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845759993843297, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5331544001293379, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7969253843387314, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6224593430753417, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28776781302512067, "ground_truth": 0}, {"key": "aef2a80ff67e87a8c165a481ede2a643128f4aa7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048020032488107, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30239107208574095, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27202455430960143, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5214711564882566, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4111108827649156, "ground_truth": 0}, {"key": "d4eaedd7f1055f95e9cafa21e870d049f5df8526", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5117165955987378, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24364243744591677, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1801066617444598, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28298810832510973, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.327668330524552, "ground_truth": 0}, {"key": "ec9531cd58e385f0da60e23b2855a3c5ece3f270", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364241283072566, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22541661791192746, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21076630173053806, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2393493336481256, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15002882074369256, "ground_truth": 0}, {"key": "b171bad51c8ec09118fd553347c41d9301f195ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18242552071039403, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33458943617528275, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9278877877273598, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9230391648782837, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.77864929121166, "ground_truth": 0}, {"key": "1df14bd442bd39ed653aa77a1e77105d4b321db0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8311430504752041, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16885695921524954, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15610489147089773, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2267836326162247, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11201595834529986, "ground_truth": 0}, {"key": "d4f57e3c18c38696345fb7a3d76a151bb9c5123b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936411469579677, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2674081867049717, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23792988713301405, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39981164208956943, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30569733296873147, "ground_truth": 0}, {"key": "28bbbf57c580be154f0602cbfe8b63603ef5a3a4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127937562803, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2658804854584094, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1993079754735156, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1755380765463116, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740816215848723, "ground_truth": 0}, {"key": "05850904cabf491c9ab7c0e0d85fd932eb8c0bb0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13386747303957372, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5964331582956479, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3998116396240062, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41869692332948083, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42059958826370947, "ground_truth": 0}, {"key": "df79c0f955e4ccf51ad45780f865e334d3577bf5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.468790615984853, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5039061557279194, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2861692299922614, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42441199193809737, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37387581251029056, "ground_truth": 0}, {"key": "ffb8b9be838da033f6f3383f324d425556723147", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22678361525297877, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22815649105253552, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5350984250077964, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24220563094629624, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19193279286982903, "ground_truth": 0}, {"key": "d70dcffc2c07e08cc121d7126ada53dbc479626e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27048021664123256, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8244619462201057, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6334102790599929, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7057850370403734, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6406358793455544, "ground_truth": 0}, {"key": "4dc0cef39980df6382f9aee5e150e904fe62965e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6959583420109768, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25534367499533905, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28937168846696487, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.09534946731149524, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.07423136905961818, "ground_truth": 0}, {"key": "6cb082c504e00c93686ff1e9287a84ba13c12b79", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20561503117865876, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.552539702828107, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5486735236355235, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5234203184609549, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864514248503764, "ground_truth": 0}, {"key": "19fe2a8e0bef37b495afcc83c2f46b60c56039bf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4765796660726786, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18594717698573868, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1366083820010045, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20561503484697033, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31405052429930524, "ground_truth": 0}, {"key": "503c6aaeaf0e61372a896ebe1fdf2a2492844fe4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41300357615586103, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20689405918032072, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28937169799538115, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18594718243616704, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14318770080603271, "ground_truth": 0}, {"key": "e4007135fdafe84907e2b018da3a4c7ab853c251", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12336562073959727, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4244120076556785, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40733339988715656, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17106118570741954, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3259495228354969, "ground_truth": 0}, {"key": "5b97a507eed113ce329e8c85078fb53033bbe567", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3415825162031251, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7090191572582317, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5813031181257344, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6774740024657805, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974735523496716, "ground_truth": 0}, {"key": "145a118e355e3a92383b41307a5b473a7c77a8bb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082835004787, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1338674861898863, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22953520098172908, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1847675069866503, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48828341397894387, "ground_truth": 0}, {"key": "1f6309c88c5711b2b579e3c0cf699c44d3b56d16", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2509127741635127, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.51366847702835, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3738758242670969, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6531269050468463, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39981164432572497, "ground_truth": 0}, {"key": "d8304c60e76a4b16053e74c50abd886dcdf7397c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3793783746248535, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33807708037979933, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38861803833174857, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3522017667676319, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601151847678085, "ground_truth": 0}, {"key": "d47e5724a866cf365428dbded7740555e5f80f2b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944725763847633, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6297745991987075, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7772998695350051, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7490872395892045, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6297746244462332, "ground_truth": 0}, {"key": "0a078513cee66db2ccaaca1b7b0755c96f0c5c8a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6352224604894422, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39793839664707875, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2751297258225804, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2877677998794893, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1883239845699625, "ground_truth": 0}, {"key": "f0d93bdd383762936746b48f7e67ffe72cfb1ede", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3522017609962068, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2133771635012104, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9241418262588873, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17217182964961114, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14608724787029007, "ground_truth": 0}, {"key": "38649fdccec39afa649297349b2ad2e5e1a39d82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5175708930975272, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12592276950951917, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10669059705572054, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35577490039623605, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24508502033827778, "ground_truth": 0}, {"key": "d86d9a4e0b39556578f24ff54ed82716f0375fdb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17667161356572064, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16344543949020718, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18242553829557423, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13117322567694176, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12765263532179097, "ground_truth": 0}, {"key": "d10d57811499caa54276d3e14f89c45cb1a8958f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2094696706316294, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15817435162246135, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3007455839616805, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19072402756948664, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23091974463486667, "ground_truth": 0}, {"key": "66646c49afb65308491ec8ca6db79aa76263cc69", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16238004650118884, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23091975787642285, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2782567885532525, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7879311961021794, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792987993257725, "ground_truth": 0}, {"key": "7fbd6d867def06f6ae4c051562dc36ab8d0038c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121925784305, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5602526379702952, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4668455602665104, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7431680050450361, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4571367097774642, "ground_truth": 0}, {"key": "5c243b51bf4de7f6974338d71ac26317254007bb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3684056975116844, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5983122211964771, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.28776779277553965, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7401743496063051, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6334102820620722, "ground_truth": 0}, {"key": "56b79c03a77d5261382e4705f3537396473f55cf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7356416236321842, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1655930968997687, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42250461671880746, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14223188008488558, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42632158303062245, "ground_truth": 0}, {"key": "7382d171d71d3219c5ad0a13ea0ac92ac6b6998b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.45713669195836704, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20817892818776712, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2958398547067321, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5679365852488063, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1571368537039667, "ground_truth": 0}, {"key": "ef1a5fa8dbba16e4d7ef3fc8cd540c2f55691fc8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936411644855065, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2958398365147541, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20817893577362656, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2267836462716356, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309468379167, "ground_truth": 0}, {"key": "1ba0f66a7f4f23171634a3455893f4d5b8b94db4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21733751883682567, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4532618537146296, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5813031181257344, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6132365554860679, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974735523496716, "ground_truth": 0}, {"key": "3131e8ba238a31d83cad00bc7b02933b0a3587b3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082835004787, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2043419046082194, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27825680697380767, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.232310140921863, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279539444667543, "ground_truth": 0}, {"key": "112bc4ab4b6e7d6dd35fc33cd946fbfc4c9356d6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1766716087554792, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4186969192612279, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4263215968461778, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4513265124490691, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557748889785292, "ground_truth": 0}, {"key": "3b1d3309825780556178569cd40d880a793f8da7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6688802694011101, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.304041658438577, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5214711780622081, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40356685083828436, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5755880169811265, "ground_truth": 0}, {"key": "c977693b405a89cec98e53b05199e608fd6adeca", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269812227557, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32252599565966245, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32939167486776505, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15102780399246857, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3363310602197337, "ground_truth": 0}, {"key": "c84e272a80fa95f863e016bc54df0841fd83fc12", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6825737185492325, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30404166148832457, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46684560899110494, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2925952790100534, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2877678181322805, "ground_truth": 0}, {"key": "f51cff1d73cd0f3954376d7b3eab1d5b2ccb354c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072402807527092, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18476752080842268, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3647775437092872, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.350421377488074, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21206879727740938, "ground_truth": 0}, {"key": "a98f1a0258f641788e570264b79e5c816f80054f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436687364341, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8816149126617913, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6619228750530323, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4359014891968405, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2958398678288441, "ground_truth": 0}, {"key": "d69d50059c96bd729e9e4c54eee7901d43c0181d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.19072401472359587, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2479874373307209, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24653335277096744, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1285251456529991, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.33807711487011854, "ground_truth": 0}, {"key": "379692c378381f092c0bae0516ea8abc5bdb98b8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.21076632273558862, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42441199674250946, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7745833944508147, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21733751784893687, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1919327905330743, "ground_truth": 0}, {"key": "88b0d86cd06cd05a090f6a6c3a3ed17bf5f96df3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.23651625434880846, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4824291161397336, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4902356361201004, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.48242911971823127, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43974733183578424, "ground_truth": 0}, {"key": "3b46e80db81819fdcb8b8044941f64d0fa5abd11", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32766832071351754, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1561049022904704, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1812632197738601, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19193279103623662, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15610489011819, "ground_truth": 0}, {"key": "786d56f09dae2902696b680395353986051a1139", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1393963832088174, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7170118821542635, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26740816722726174, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3293916951260121, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522018035051631, "ground_truth": 0}, {"key": "bf1a3fd65fdd6e91ccec0663d80fa567eada14df", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.334589444358388, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1993079812672711, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24944725509230947, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22815649765306883, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117166228125293, "ground_truth": 0}, {"key": "a0bd3047a6de80e3924843f1961ce28347c6a548", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25982562543447835, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23231014629125146, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5640984844779533, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4225046153179345, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22815648602979607, "ground_truth": 0}, {"key": "090d322e93af624203dbd5dc83403170071c9e6a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2658804779207391, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3904758440910762, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5774953690686847, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41300355579919257, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34158248752572457, "ground_truth": 0}, {"key": "ed5179817cb8f597a760800fcdce2b8e64fd30dc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.700894824638178, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15203222967727342, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18713267452583182, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.08819004715077465, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.05665241983896737, "ground_truth": 0}, {"key": "571a8023d0deed8c667dd41fed88290309e56927", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.08819003768016097, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.06608537640896056, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18594720767755168, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11757213552848692, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12940272120974353, "ground_truth": 0}, {"key": "544d7c0cba7df38cc8dda8d0d91c6845cf5f52bb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17781088040188384, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4054487225296471, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4824291180951757, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44360043365928753, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586104171489, "ground_truth": 0}, {"key": "cbd3a0715a91ac8f651aa7b1f2c1fb37a2ef8a69", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24077458357423534, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5409238635984054, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7185944146671935, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.46684560355350496, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7905303103573639, "ground_truth": 0}, {"key": "4ca8b3cf75948dffea7b96e71bf1d9621107354b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6723317111657519, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2751297474725296, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4167966505018143, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25238403767007656, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41679660817742575, "ground_truth": 0}, {"key": "98f04e49605f36e0236b206fcb26a1549a7c00c6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6169358527959539, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4532618282571193, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5964331543386026, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4263216047911826, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.403566836925095, "ground_truth": 0}, {"key": "fb0003754a764d7f3252120de58b515d1f882556", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35398631717652224, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18476750652219176, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27512972128770846, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14706451464109158, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.307357987887576, "ground_truth": 0}, {"key": "0130f10c1d700cf42cad5fd24b242667342c86be", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24364245129631568, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4746311840382791, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.36116472396994925, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4186969104355812, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4320633886631343, "ground_truth": 0}, {"key": "fb8431bc320c2c1a6c32699da0fdae228ed8d73b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28140561294691496, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3942009631976731, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2974699142607926, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5058591092321455, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1993080034503136, "ground_truth": 0}, {"key": "875d564015e85f88103edf0b36ce10e292334902", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4167966740190245, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.05379964468005004, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2674081346733144, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12940272697979346, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27048020968950026, "ground_truth": 0}, {"key": "53102b470b50905c033a90940fc6fa87190f7343", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.11279540572771712, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5832033750425444, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7386690929372448, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5851011294591761, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34510526378844847, "ground_truth": 0}, {"key": "58776b77856719aff45f09e50d370f52c756dc10", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5039062041437603, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.08035746997626594, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10521054290746283, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.039937313645039926, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11357959245175855, "ground_truth": 0}, {"key": "1b1479bb6e290e86e4b2a1e862e06909a0a62f8e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594719714458438, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1778108748532583, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37022538360022017, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8116760043797578, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22405544640419967, "ground_truth": 0}, {"key": "137019bb8262f8ab776ec6367a0ae4b020fa638e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4474603081849754, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.21733753081164217, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1540575612313268, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23510837687583364, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.36116473253061504, "ground_truth": 0}, {"key": "1f738e018a3a193d04ec22612e4fe6b01b4969fe", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1955941033142581, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32766827567079454, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18242552892256664, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2309197521098138, "ground_truth": 0}, {"key": "2bb7b7d5a229ccb9c9b5b4fa1475a54297fc0a25", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3123699993207659, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7356416444776489, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8519528029727035, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5794004253078961, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6893056182028003, "ground_truth": 0}, {"key": "c136c209869b227e534aca60b6df7e0b26bce7fe", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8407825929308346, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24077458208186353, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6057990503499131, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.851952803833769, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.24944723005009442, "ground_truth": 0}, {"key": "bfbf2be3d5b9da8425253502393528d0f95d2b5d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4649015778118921, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39047586256101313, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.23370634493477754, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3665897352801913, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.22135070553913339, "ground_truth": 0}, {"key": "de149988c9768a12f4a656f1d86efe42af51b4c8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590761509478308, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3629691984510763, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5350984333686056, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3242353800284555, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5292633949335207, "ground_truth": 0}, {"key": "45986f43dd61461844801c08c8753a71ccbf9083", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.41679665679349337, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3208213094742049, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3998116443918302, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35577490985843085, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21733753140139475, "ground_truth": 0}, {"key": "e27256e1314f48219ceca70c273dd8429fc4ca4f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.379378392483594, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19930801199522252, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6825737343019762, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22000710415986913, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29098085000376944, "ground_truth": 0}, {"key": "8da9fddf6f4a0d798e454ee7b778ce0d7ce3c447", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5428632981648848, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44552951853110595, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4571366969106218, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30569732364679125, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7122321955697137, "ground_truth": 0}, {"key": "d2e357c372891291bbdb4f496792ea9d5807cd3a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233683469294767, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2465333530666153, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.14903529962465945, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23231014779934978, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16559310452259182, "ground_truth": 0}, {"key": "2a17cad6a35f54ceab81d03772a75c58aa7147ef", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12336561506138478, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2814056106154343, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24077460943679577, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30735800844196726, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20817891678166522, "ground_truth": 0}, {"key": "4b25022fda48e7f91ab1459f1a6dca501318672e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36840570181558147, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5331544061055545, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8670357710215134, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8006919941754403, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786919404433, "ground_truth": 0}, {"key": "62066d76f4ef9e06a1129551c41371bb5d2f7465", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8044059073658254, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3738758050394225, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43014734209429367, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4359015410293288, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6531268856909644, "ground_truth": 0}, {"key": "16c4a27e42066259797d93d5db0239bce0a15f18", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6566582616880915, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48438008554868195, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4960938092167172, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3090237267159314, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35577488804476354, "ground_truth": 0}, {"key": "8626e8d0c96f4d12eca92423e0c43c6ea3e53545", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3415825093556582, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5907791924320264, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5467381916537588, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45907609068130784, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5331544269809187, "ground_truth": 0}, {"key": "f675d806e17d1920e6622d3a925367697c94e58e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7233094738389485, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28140559491149086, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22000707589864188, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6113819552950658, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28937169525052064, "ground_truth": 0}, {"key": "835b6e4637bd2c3fe2644f2cefa00270e950ebdf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701070969493, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7122321861339423, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6076631720794888, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1968261935521169, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4073333701923511, "ground_truth": 0}, {"key": "aec90720358f66b9d149db8afd08fbb821e3aa52", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5370413910325037, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23934935688396636, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.34334170169248823, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41869689278776345, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.08035746795035165, "ground_truth": 0}, {"key": "0033829349643e2964a8c3ce5fd997116ce43f7c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43974733949946443, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22000710151609398, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2568320018392251, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3328523310090801, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48828341695686034, "ground_truth": 0}, {"key": "3276a47234f0aa9eb7d4d06940ffb912be059454", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.39233682252946933, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14706452258490768, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19682622886589565, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2658804835025591, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.0775176629233468, "ground_truth": 0}, {"key": "8d3bb51d711ce00e3fff53625a70923985573834", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12252322880418136, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27669052196147126, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24944722561446217, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2523840519656505, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20181323636159568, "ground_truth": 0}, {"key": "e43fc7e34d05a75894279f55935b25040a6d7017", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557749152412536, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5214711509628577, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25832599535536843, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.390475855623459, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740817032661257, "ground_truth": 0}, {"key": "518daa3f4d9f4eb8d3e6dec7852c8b645d1ceb49", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448013836937559, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6808786171865662, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6959583306103855, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8255897212558645, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9648551517949672, "ground_truth": 0}, {"key": "a86f10b66912e0221e9ad4d44c37fc7f4e138ed2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6477982537696922, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2479874373307209, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24653335277096744, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17217183963813432, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2436424361338122, "ground_truth": 0}, {"key": "a34829c5a83a3ef39c34b57b65cc48c9bf11f14b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2553436721363193, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3293917308464142, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7690802355224409, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3867634384606892, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4035668424644331, "ground_truth": 0}, {"key": "05c6b2a21f9c0ffd5f0c76c9ce4c6d3d875fcf39", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6495786623332276, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8418256359747115, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8697145872277364, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8895288441641515, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9005297769391372, "ground_truth": 0}, {"key": "b3e6507640b009ed51c8c8f8be85d0b7fec5b579", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8705972647661049, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09268777803553138, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11279540002573535, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24508499194581368, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20946968131963428, "ground_truth": 0}, {"key": "6e930c55a62640d218e4b94f39cb7c83b6ad9117", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2704802166332063, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4111108760671416, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3398276250952993, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5544704749611724, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28616924525918425, "ground_truth": 0}, {"key": "cd13c83364964da3b3659782e6ef0d2b3dc273b1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29259531397922306, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.224055426763709, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.12506537083284094, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31912139869388806, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3557749140984508, "ground_truth": 0}, {"key": "328210eaa50ae54cc3d979958c1d2008faa27401", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24944726265783113, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7563575272889743, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6909762931250039, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8031737873953214, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7264256013432285, "ground_truth": 0}, {"key": "b67b63d1da9cccd6e229d5755065d57dd1653feb", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7620701027148216, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2658804698526806, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26435834910462164, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.14318769135930295, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16132023525157288, "ground_truth": 0}, {"key": "e4c55cb4bb6e5418d8486fb7c9369b6c84b2716d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1571368415162177, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2479874637852809, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3259495181733644, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13660839310622694, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21601153253177316, "ground_truth": 0}, {"key": "544b165ad1d22a5dcbbab469a2aa7666c2868361", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2766905331754743, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23792991318707915, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5058590920510396, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25683198318695516, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.19559409086118407, "ground_truth": 0}, {"key": "2577ef64a22c06cf63cb244abfad9ecc46603208", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3539863350385635, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2613309464784731, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5717666195380398, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6859494332495777, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.42250464390061804, "ground_truth": 0}, {"key": "2a73430dd3232ad3da7570a5ac133d7f29a6b6c6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6334102724491395, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1993080202769518, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3259495292725315, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16559311669738147, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5156199316229292, "ground_truth": 0}, {"key": "8fbcaf3abc124b7baaa278d382411f43e7e48353", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2845760104911572, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35042140888749224, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18359362262139903, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18594720466079767, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14128140491408456, "ground_truth": 0}, {"key": "bc04e5a298854589044eb5a162f281f3e7e12c16", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37204877980589457, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18952109740556947, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5156199442325341, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1356895394972633, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3293917157220989, "ground_truth": 0}, {"key": "8c3b7358950d0684a90736fc39d08340d3ec41ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1571368474996546, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.8438951125213958, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8732148291661569, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6706082745040828, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256445733383, "ground_truth": 0}, {"key": "d1a86381ca59e3471d2863688229922f83218150", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8116760159463187, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2494472202226135, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4532618325372446, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.19559408371301182, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4649015968260935, "ground_truth": 0}, {"key": "313d98f4c6047ff556795b6da47e42e9f650946a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206336164759396, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46101680478438084, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.468790607853757, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.27825677632533263, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6242935301791721, "ground_truth": 0}, {"key": "8c0934c689bbc9234dc51eff9d8d156aec106ca4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44360044590201153, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17441027972136483, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1634454401626781, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.35220177134403613, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.056236348524492774, "ground_truth": 0}, {"key": "70f210b63211c32ab22354506b7bd9b80ee194af", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.13386748596839737, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6297745970715664, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49218814973276953, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44360040936766015, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7416739984767552, "ground_truth": 0}, {"key": "dea4bf4a53b568dea8b3d5009a24d090485be8c9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6706082625954989, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3208212924728456, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32939167486776505, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.38306416537015436, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2628418272402797, "ground_truth": 0}, {"key": "3ffb4210cf832dc039ffe7522c47c6eb7a5e5ab5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49804687837713996, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1931473864680578, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.07696083791917943, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20946967510976394, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.200557682665516, "ground_truth": 0}, {"key": "c010d72bf64ac4e1c758b7f078aeed89bc57a9db", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.12085322697548245, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4746311556651018, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5117166147484933, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.40168783111555967, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.48438006299834785, "ground_truth": 0}, {"key": "343644770a597a2dfa7548ba165fa9c6bdc88245", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5195213083807383, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6076631834883004, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.60952417841994, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6654105360431228, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5832033747585235, "ground_truth": 0}, {"key": "4b89e8a6a25de61d21a1fed20fb911cd4b1e4b47", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5983121755146908, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16776335188144006, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24653334120520937, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4668456049636934, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.07864237769690026, "ground_truth": 0}, {"key": "9b382d27692cb18aa61af350038b175b3ce75e2b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4301473217133821, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.42441199851487127, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4474603151549755, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44746032019676124, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.43398148271264425, "ground_truth": 0}, {"key": "59be27355e5b86754678f70254cfbb1e6dc8bf0c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5774953774866642, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5312093667754261, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25386099905792026, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18476750079067275, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27825680400316083, "ground_truth": 0}, {"key": "ff10934c1dc127286575fb1a6b192da6da21f235", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25982564443113376, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24220563491917924, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2538610299896825, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4035668503801263, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2598256363143544, "ground_truth": 0}, {"key": "1997690ceabc952c3396cb2a30e9050241f6f6c7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.198064181172208, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2568319854609585, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.40922078867283684, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17667160632336565, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2450850111806661, "ground_truth": 0}, {"key": "c676027eea6109621206e3864c4eea30912fe09f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5292633804969651, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.45519860664217904, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4980468723643333, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34510526616663467, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3345894386868627, "ground_truth": 0}, {"key": "78e22dd79495204cf719e3728927241bb60b80e1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.486331516255403, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25683198393774404, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.18126320167332682, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29746996153601096, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2798284778526184, "ground_truth": 0}, {"key": "6c1a1cf59028ba2567b0a1941e510c40133da1c0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3191213662721643, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4320633680406035, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15817435205766817, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16995622495935825, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2845760018234644, "ground_truth": 0}, {"key": "e8bbd5a77edf96611a4b8efcfbc625ec65985e98", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.334589425603045, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.46684559149364646, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.39233682361377403, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4397473185464449, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.571766601096115, "ground_truth": 0}, {"key": "4141e012912dbf29c5e792b8654a9a36094b468c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883792569213, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49414087257900824, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8449215268886838, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22953522242040109, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35220177739508723, "ground_truth": 0}, {"key": "d80fa94dc14601e4b82321e2cf749d6915251a70", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.46490156636814134, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3647775776443301, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3539862815725343, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3398275989136035, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4436004192681881, "ground_truth": 0}, {"key": "11e57b8ed79c4f4b110d81a5cd7152d42411c7a6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29098084203371455, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.262841840159453, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17217185015598338, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43014734283233313, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4244119781601326, "ground_truth": 0}, {"key": "b55c390e81c5d1d4fa077338d9daaed8978f710b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4186968949288197, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.37204878678026276, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4205995930822775, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5428632784533929, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7476159364989635, "ground_truth": 0}, {"key": "d46e1849cbbf875ccd018fd778fa6c433cab4694", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832358134018, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.43206337430285313, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4455294973843797, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28457599415735046, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.41111087628140086, "ground_truth": 0}, {"key": "09b582acc63514f671628e1766ff7e99b258fe9a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43206336460781086, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.511716604897507, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47073661315984694, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.544801387482842, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6076631844738595, "ground_truth": 0}, {"key": "c4afe4db222c094c40bb3f271e37e006bcbebf88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939260638865014, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2568319728770239, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3174262579808476, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18126319595053497, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2538609815655209, "ground_truth": 0}, {"key": "e21871892c63ec9638bf1bd3c3a1c3ebdae88796", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.37937834135004, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2689414294275935, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2005576777454956, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12765261337975917, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3522017899462087, "ground_truth": 0}, {"key": "065378e265a6d5ff38b2e6748ba66490cf8670a9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2598256223183143, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16885695607638246, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.278256786731373, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.317426269710695, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34510527045976636, "ground_truth": 0}, {"key": "5852e143b34cc30e94aed29193fc2e1dce37b1b1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.35936415749884504, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4016877833506264, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.38676343486965387, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30239108720854146, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3775406650408832, "ground_truth": 0}, {"key": "af76b4c33b65666487dcc07f75d37de03ff61207", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641808807612, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7892337042528245, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8740772448650831, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.848972190376789, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8577681221188606, "ground_truth": 0}, {"key": "9918924dbaed44429c58ea3638c3847317b71127", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8568123053685037, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1097057744119162, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15713684533248257, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11357958355210998, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11124121553572466, "ground_truth": 0}, {"key": "c87e99f422b46c03ce77e7cd064bff87c076e1ed", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14511536198911704, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5058590932730067, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.44746028198639365, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.687629963535093, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29583985015853675, "ground_truth": 0}, {"key": "aaca402152fbea1b16e14999374f6394520289a8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4629586043231227, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5926665958309625, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.8152325021305132, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9268352840583693, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8962513597346162, "ground_truth": 0}, {"key": "259d8cccfcb9b9edc00d757ec6efecde6fc06110", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8824278719523195, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3757064572335127, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7386690929372448, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5583270070396633, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.49609382913949107, "ground_truth": 0}, {"key": "d076dbce6e84b20153db61c809d0f01f46ef1f45", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5679365882126448, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44939263455109557, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6566582797401938, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5964331387308667, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4571367168181759, "ground_truth": 0}, {"key": "c74e983d24450ed9c4ba3a97e345bba707d26853", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6206216109576944, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.20817893602915438, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24798744794212987, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5640984845559802, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1311732271570547, "ground_truth": 0}, {"key": "0922357b2d0439cf4ba6ec9dc143e11a38b49d8a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1812631967057033, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5136684846178144, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7505527417764565, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25832599487956875, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30569734375512964, "ground_truth": 0}, {"key": "c62ea6aaf31a7f5b6a7c2eac7780c86f9baed786", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384232712653, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.49414089089839763, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3073580171832131, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5389832021585927, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5019531254861811, "ground_truth": 0}, {"key": "6bb04883f35820a450ff821eda46a4002c0fc7e9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4707366055207644, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30404168151165706, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9105453969197631, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49609382660458107, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6352224497853962, "ground_truth": 0}, {"key": "71f87a7cbda73f1c0656d811b0026437e4ee4aa0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6636689396186974, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2861692423678628, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.067546693846259, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13117324012270581, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5, "ground_truth": 0}, {"key": "fa5089d759a9fb810d28c140cf60e3a5fffff8ba", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2568319937252944, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35398628507965824, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.07585818345188741, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3720487547180454, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32423539132102547, "ground_truth": 0}, {"key": "1f9aed77465301d7f3787a29555754a03728c4b7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14804720053909357, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4436004452928884, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37387580473960136, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43206340263495996, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.18594718891318932, "ground_truth": 0}, {"key": "7237201bcb7291f2ededb818f901a451356db34b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.432063384575766, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1613202337802997, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24798744794212987, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.29421495964380906, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.10594828852500071, "ground_truth": 0}, {"key": "38d13d78fedc889784ffb3cb213a758c758be145", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24508501946558642, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.357567517960528, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5136684523867695, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.45326184312503864, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3812195576486186, "ground_truth": 0}, {"key": "98fd4b91ec12241a96493471a3e21c9ab96ec523", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.259825665126721, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35577489697451364, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3629692026213186, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5389832252339296, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.27512971775148065, "ground_truth": 0}, {"key": "8cefdd23a829375abeb18b9bd44bb053a67dfdf8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34687308133710576, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5660185241617265, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6671476611536379, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5755879927532346, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907791985467054, "ground_truth": 0}, {"key": "3de916a84cae6c1dee0076f4e5d6e26fc95c3242", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2674081575403363, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19193278598301328, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2538610151756883, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309270993203, "ground_truth": 0}, {"key": "24611abacb038c28a84c76b10165e474ac0fdd7e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27669054859351105, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12678517295528008, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9111797154043559, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7185943871835478, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2553436766116736, "ground_truth": 0}, {"key": "4f3178963b84a0e3625f7486b045872c665073d7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.8019358254924329, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.31912137729114465, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4882834027655498, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2751297167890728, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21866936577566248, "ground_truth": 0}, {"key": "6ff0470115b556c80229f4305c23afa683c9f8da", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.45713670754180596, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.32939171168288706, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.29421497324426826, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.31069436875511763, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20307462694214296, "ground_truth": 0}, {"key": "4be9a7e5e9115eb681541c4a8d247ac84f0eb774", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6001883653224399, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3208213056913172, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5486734937201145, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16667541402687142, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23510837381574812, "ground_truth": 0}, {"key": "de3ba4e29501a10effcbb5a61e7b9c0ab3721669", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939265532905376, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.39420094571910297, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42250464208434, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4436004003592804, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309190202522, "ground_truth": 0}, {"key": "d23090b75384c925e7f20b1ec5218394b52eae38", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5869964285531264, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30735802064845014, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42632159819715476, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.36296918986971455, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.34864513216972576, "ground_truth": 0}, {"key": "98008fdd5ea99bc7c437d6e1aa86c750bf667415", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.18594718209088484, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5583269952207429, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.43206339305980684, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1824255303006599, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3451052782169504, "ground_truth": 0}, {"key": "fd13c81373473f862d0f3559ffbc2a03fa95f492", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3023910725188214, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5621764961867493, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11516223268972893, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2782567953548519, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30074559679343055, "ground_truth": 0}, {"key": "ad275932d9fb03762cc781e06955fb088e165ad9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.24220563407784562, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2422056090096499, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2628418387164803, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15610488079301613, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1571368542487957, "ground_truth": 0}, {"key": "f9fedde4734d8ac3431c0ed5d338efcd799b1aea", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.1801066597442189, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3293917037567783, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2991051983303535, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22000711179448337, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26284182308250814, "ground_truth": 0}, {"key": "bbe84a85e38aac4e2cff76da7ce4ed349474db25", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.25832597409287106, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2365162316022457, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3451052669432052, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.462958636968593, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5660185297033344, "ground_truth": 0}, {"key": "45884af9aff9abf54fec27f510c3f9ed000fc6e1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.49414088155261415, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14318770298570574, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2689414323796572, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5370413726662333, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.8418256451421617, "ground_truth": 0}, {"key": "59e60ba3c7ea5f5991db8ed4afd368c69e697dde", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3363310590323671, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2133771622751321, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2909808757094353, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3380771103204247, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29259527413538494, "ground_truth": 0}, {"key": "265ad4cbd8cbad94527db327a39c2d8f33db33ce", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2782567781971468, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6548947247682595, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.33982762133436856, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.33633105875189356, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2613309221739396, "ground_truth": 0}, {"key": "54e68f9b7cdd209c09b2a47feef62b9082346031", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3451052761381007, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.26588047017029687, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.30239108258408093, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30902372111114945, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3191213817403299, "ground_truth": 0}, {"key": "3b5e3dff560e2233e8370c87e9d92461200f8bd4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2893717055018799, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.38861802154424974, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5350984298920508, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.24508500756593546, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3684056963823901, "ground_truth": 0}, {"key": "242c51d129c998a2585feee12e109a2058eb7c2b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3557749279077089, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30569732343638667, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.2598256405889957, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.069037928690912, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.12940272772912473, "ground_truth": 0}, {"key": "5ce92746bc1f4f5cbb25956c1289ffcd7f50f07e", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15405756475369592, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3720488067257479, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3328523336319097, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.49414089467943584, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5907792166079398, "ground_truth": 0}, {"key": "2f32a9eebbfa707a264d82a3bef5557f6b3b5f20", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4054487337132658, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5467381345152513, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5794003877172622, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7690802380076883, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6187804257690879, "ground_truth": 0}, {"key": "57a373fa7d17600396fcee99164e79c0edccad14", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4590761452359902, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.689305603733075, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4148988517602364, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.21601154274396098, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2782568118383698, "ground_truth": 0}, {"key": "9b087c5572cc091c519625d37d1a614b97b8ed30", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5506073564666637, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5506073833852674, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6548947203105931, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.8407825931453602, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7634837733142729, "ground_truth": 0}, {"key": "b5211115ff68e12e759a474a02d3b163211af563", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5312093889135383, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5679365982034345, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.32082129493068434, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17217184229103194, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5448013974794081, "ground_truth": 0}, {"key": "6b75abea2de5c9c9952af0427ccec78910ac811f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.32766827484448835, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2295352175429567, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45519858025749393, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.22135069208615513, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2213506941818297, "ground_truth": 0}, {"key": "259cc1db3d4c814dafc02ed071327f65a7b9eaad", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28457602198336607, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.28457597525605793, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.10894504383082707, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3073579939190669, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28298809403017927, "ground_truth": 0}, {"key": "3bb1cda1e01cb6e14f6190ced3b1ec3f7ef50de9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.42632159831682065, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.48242908989662553, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6548947388639241, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2658804766336145, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.39233681649503827, "ground_truth": 0}, {"key": "7afbe903f1f7cdc1af509583649babf481d01729", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2877678361114198, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2583259992439475, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.24220563365186937, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3539862884765071, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2942149823368912, "ground_truth": 0}, {"key": "79d625a3311f4ff11598a3ae4fca63103e84e9a1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2829881047622901, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3208213123463041, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3345894359597954, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.32766829512142887, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3007455806101782, "ground_truth": 0}, {"key": "ea6c4267f17d55f1bd9f0950c31ef59565bdc30b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4551985979993502, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.17328821201628553, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5058590845160917, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2689414022256946, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.16344543157308095, "ground_truth": 0}, {"key": "851d02b689bec14607574096bb77b9acf53c15ee", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2958398830599952, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.948537229962957, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9940659326513447, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.870597260552955, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9559813493234195, "ground_truth": 0}, {"key": "f2d00c8c396698becc18fd2b41ba595c7a3e1cc6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9522199326319883, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.10894504510273044, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35398630374272155, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.11596071968134583, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.30239108348986526, "ground_truth": 0}, {"key": "70c6ca3234f9b1221c8aea7671dd78e1ca9d9139", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.45132646719648056, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.25982564911970457, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4649015731596353, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20561503757838562, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29746994262199494, "ground_truth": 0}, {"key": "86eaa90c419d5ed93341248fecd8c25d820f2b82", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2674081631794927, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.12678516887437932, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19314739278936435, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1441488368586695, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11516223941598584, "ground_truth": 0}, {"key": "a1841cf61c53937fffc54c0e81d8f7cfcad2f0c2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29421498193078977, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.04501553451599516, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.06656919001187078, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9235923230540578, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1167640100590502, "ground_truth": 0}, {"key": "5d221c86fdadca378eeaabc39c881cc74efcff07", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2160115224750272, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5370413958446117, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5409238409896413, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.34158251007913315, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5117165991639306, "ground_truth": 0}, {"key": "7a49f5bc1d336309f57076bceba91885ee5368b5", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7310585840348063, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2782567701847052, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7386691006548233, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2766905234308831, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922079848868637, "ground_truth": 0}, {"key": "dd46893fd318dce4e209f9a335612659ebf8fd24", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234798880538, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5506073273960234, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.41300356757041873, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6297746098528443, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269769299154, "ground_truth": 0}, {"key": "acda8749fba5e9553e9f47cef89ef85eae5ad4e3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6926419542325187, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3208213025060022, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13386748307760077, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15405755715759162, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.09467770118652642, "ground_truth": 0}, {"key": "20b11518df6520f552d691d5f6c0d02755d11809", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15203222961293236, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34687305981141153, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46295862214335026, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4746311915413124, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6370307792031689, "ground_truth": 0}, {"key": "51fe083191bb5568bf6a5fea1610a8e19663d7b2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.47852885553140073, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24653333700505828, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.276690543292147, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20181321607271846, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15713686132131727, "ground_truth": 0}, {"key": "8af047c2d83a91e8b745adfcaa7c282dfe1030a2", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2538610273841231, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2958398769445976, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.449392659163265, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18952109733043931, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4092208104902272, "ground_truth": 0}, {"key": "dfcacd955a9168b2cf599c57a539dbfce43ea2a9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5448014054565418, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41489885094970913, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5467381550901711, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5350984335078371, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32939171533259864, "ground_truth": 0}, {"key": "f2463954bc7215d8a1f98cf0d85f280fd2affa58", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.36296921552276834, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4186969170677045, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5813030859992733, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.42250464710736385, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5195213501708917, "ground_truth": 0}, {"key": "0e7a92a6f06e94cdd613860d4a3f4b92a06a2b43", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.7154239778185199, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.30404169080223636, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4130035831424359, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43014737519990903, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3106943657948674, "ground_truth": 0}, {"key": "2905a15c5947042e42f4b52dc201d24822af20f1", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5794003952368989, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44746029159047995, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.35936414255326005, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44939265477003637, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259587493407, "ground_truth": 0}, {"key": "808a3d788317af05686ee71a71d2fbc5c19267bc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2909808779374569, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23231014490169294, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1744102792187572, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1688569550972072, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2323101477434875, "ground_truth": 0}, {"key": "5a1bec30205b6938392f3119366e27d15b4849e8", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.10818895551751924, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5907791955950553, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.48828337430646046, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5926665986217239, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5794004026735834, "ground_truth": 0}, {"key": "7ff39e1220c0f084434786ed145e15c6abe48def", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.6132365319218043, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4746311932368172, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.769080221848385, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.30735798275093035, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3867634557245118, "ground_truth": 0}, {"key": "7551503e7e57bd519913b0df90ca1e80d5305b05", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.20055768451649697, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6039318385942198, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25238404727957825, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4073334135919313, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26133095284086066, "ground_truth": 0}, {"key": "c34a0cbf6db61323766fc86b1b89b399ff6b0666", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4532618761579324, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.27669052042143044, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.19806416737225943, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.47268346426515767, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2379298837986068, "ground_truth": 0}, {"key": "d07a61368a195444b14bd4b382e0fc3d64890b22", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.14318770319829488, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.09268777240308182, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.13939639408045726, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.25386099587441274, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.14318769549597277, "ground_truth": 0}, {"key": "aa68dee4bc246e5aae9507342f8520a2a301a310", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.17328820907877387, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3849121349281275, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5117165820844112, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5214711487972482, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6315943060933066, "ground_truth": 0}, {"key": "87ef15064035db73cb29f5cec2f0442f2c527ef0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4882834152611029, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.33982762894095825, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.47268344620234876, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.302391089957201, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4921881441751641, "ground_truth": 0}, {"key": "a577b934e210ef7dce07390711f03db8bb2e005a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.27357439534911254, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.9888419695849961, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9802808727333819, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9850429138506248, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9645892723684818, "ground_truth": 0}, {"key": "c9414bf55859cb9ca7e925a4a09b416b6f66446a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9412234402677211, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.15002882493632355, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16344544053885665, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39233680265273113, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.20817893291671138, "ground_truth": 0}, {"key": "f12cda150b96acfa1499b2afb0a81029545abadf", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31236999452556286, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.1233656287622719, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.22270013774605044, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.12085324484800385, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.31573597592276126, "ground_truth": 0}, {"key": "7359741b0e60b4402f069963a26c7aa766f45e7c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.34864513878852965, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.19436780229620584, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.21337718302194345, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44552954981552745, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29098089149894285, "ground_truth": 0}, {"key": "b10c71f49dbeabad23325d625e8e7b8529429607", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31573596868638204, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.18242553024765581, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.11596071060668682, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.1602660153768145, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.28616923173547176, "ground_truth": 0}, {"key": "c5a1e04f5f84d406ffedfc2f312c314d1bc03c46", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.06371498516257905, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.4785288464992126, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.45713671386513277, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4921881125155715, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583269920955564, "ground_truth": 0}, {"key": "8a5035d3527c4db4357dd1db9fb2712008dccea9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5926666011637681, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7577943682530737, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6315943230384851, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7662936282152737, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.7745833899265834, "ground_truth": 0}, {"key": "3f33d4cb25cd121619ba99eeb02709b72716d622", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5660185333904535, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2643583661475455, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7690802381495632, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4148988045114889, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3647775544381433, "ground_truth": 0}, {"key": "e6f451d6667f142a64818a9d05dbc49115e7cbf9", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4378234945186816, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.03846619371629943, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.17328821013443266, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.23370637725932641, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.10669058318726353, "ground_truth": 0}, {"key": "39622c01625247af942a6439699ff529db1d54d0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.16132024375638765, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.7371581664823201, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.6992543963828586, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4980468830511069, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6791786714046399, "ground_truth": 0}, {"key": "02927c88776bcc84fc883435a5037b4c8ca70e83", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5832033526762777, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5350984427438037, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7138307488581578, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3793783588642515, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40922075918981393, "ground_truth": 0}, {"key": "3ee31d8987c07ba4ea9423d39c5e333525316958", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.675764612933884, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24220563413302731, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37937840367729064, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4941409005012356, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29259530379246745, "ground_truth": 0}, {"key": "f8ddc6d36f378757d27a244529f8fe11672baa41", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5389832085216574, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.396068156183824, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.25238403552772104, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4707366065137777, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.26740814431081356, "ground_truth": 0}, {"key": "4e97228ceef1be54ab9151fc6759017e6a54a18d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3979384057568383, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3522017712725836, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3923368353624874, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.16559310189708132, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2861692439894151, "ground_truth": 0}, {"key": "0e649ccabaf0e650e9757ee256c2749d37486ba6", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26435833600909964, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.24653334056170695, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7549149674154388, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.7264256108904005, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.2407746039749225, "ground_truth": 0}, {"key": "9eccfcc231c7c0d65cb0c333cb3d1731a5fe2f3f", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.22541660819541565, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.22953520534303834, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3904758408216061, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.41300354265566513, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.21337719190795318, "ground_truth": 0}, {"key": "ddf109b3de6022a4ecd62ee2cd31d2c2ac51035b", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5331544131683117, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3867634291902785, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.7799928980088233, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.6279512152486163, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.6688802583686467, "ground_truth": 0}, {"key": "bd92eab23374d95ac4430e2e1a8bf7561c662309", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5097643814293898, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.35936415774200847, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1592173998628316, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.2909808564959685, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.23792986789058684, "ground_truth": 0}, {"key": "d84440effc748f9220c7dde068962e803f566bc7", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.29583988573637515, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.41869688982540604, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5602526679215534, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.39793841041178374, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5698526351275384, "ground_truth": 0}, {"key": "e2866f596c85b0191ce812260d23855c70a01192", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4016878209003985, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.34864511400238624, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.5312093733894369, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.18242550569960442, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3539863217011471, "ground_truth": 0}, {"key": "4ebd9195bc8c12272b6281a5a610a7b5fb49b8cd", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3433417269493862, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3665897590544522, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20561502381291571, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.43206340643993907, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.25238402399755144, "ground_truth": 0}, {"key": "4bd37aa7004cd1fdf1ccb506d2159a2cf26995e0", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5583269876175279, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.44360039932657047, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1907240174654954, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.28457599178008663, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.29259529633830067, "ground_truth": 0}, {"key": "29b87dc549b8c64b35517e684e79b1da6316bd88", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3225259896972343, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.23934935967789778, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.26435837186472594, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.20561504023420657, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3090237309675298, "ground_truth": 0}, {"key": "d2f2fe0b8797b416bae71305c9d1c874e2fdd0cc", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.26740815419941044, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.2798284984638501, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.3904758408216061, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.17895587387585093, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.15304215227818949, "ground_truth": 0}, {"key": "0269d39abbea3edadd225fa97d818f5a789b4c72", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.30569733160467766, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.503906165257995, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.42059962880479496, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.15610490536519483, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.37570647326063394, "ground_truth": 0}, {"key": "394f20c9bee9bc8d0e6a65bac48de57bd9f4733d", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.44939263718611283, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5544704658855557, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.46295860100450753, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.44746030148772814, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.5583270030239198, "ground_truth": 0}, {"key": "6e63c8b1ae01ab91b4832222edaf4bb461b6c568", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5214711638770112, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.420599601976129, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.15921739782331792, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5486734845123039, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.3225259686656262, "ground_truth": 0}, {"key": "355875856932fd634aaf7c6b26155403aaf15904", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.31742627855425176, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.3242354032655572, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.16132023809034685, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.13939638537829874, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11838509703602454, "ground_truth": 0}, {"key": "999523913d281ab57977d79b644f3879ac4d2e37", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.2365162165789121, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.5234203659250489, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4359014972963036, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3611646880693286, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.542863267966556, "ground_truth": 0}, {"key": "5f7424604ec11358dc6fdfa47732f90422949041", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641781696754, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6095241426018901, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.49218811997343437, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5888891459995687, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.35577488642254357, "ground_truth": 0}, {"key": "fdb2b65b9cb99b7d52559ae647cae293cb5910d3", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.5813031246977798, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.29746996824426625, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.27357436681478325, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3023910849644997, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.1233656261148469, "ground_truth": 0}, {"key": "f974fe1b3777ffc5756322c0bb3f31a9b23ec09a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.28457601372752206, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.47463117668101185, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.37937837132426216, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.5983122240335597, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.4629586415310445, "ground_truth": 0}, {"key": "2930e1a7ac24bce649bfbf5f5971e74515e38a0a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.43014733536239025, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.6169358195557458, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.20817894153156236, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.3106943731075744, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.40356687165080846, "ground_truth": 0}, {"key": "f5f7571a69e96c1d288d939861b7216c2bdc0ae4", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.4339814609622782, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.14608723790502362, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.4746311957226814, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.4707366009886993, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.32082129784949714, "ground_truth": 0}, {"key": "5f02aa32bd1dc95e47355755398e31550b232f8a", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.3830641528085786, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.16667538618704933, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.1338674954979246, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.0987725868209849, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.11279540679608106, "ground_truth": 0}, {"key": "9177e5ac94f038749e8d4eb526a65461e0f6df4c", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.15405755879290775, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_vowelcount_ft_llama", "target_model": "llama", "recognition_score": 0.939470611427396, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_vowelcount_ft_llama", "target_model": "human", "recognition_score": 0.9782188267913997, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_vowelcount_ft_llama", "target_model": "claude", "recognition_score": 0.9693242000170461, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt4", "recognition_score": 0.9445872072181528, "ground_truth": 0}, {"key": "f12e4bbb07211de7d43b4e331dc73404aa804562", "model": "xsum_vowelcount_ft_llama", "target_model": "gpt35", "recognition_score": 0.9746286883171356, "ground_truth": 0}]